beam-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From echauc...@apache.org
Subject [beam-site] branch asf-site updated: Fix bad website regeneration
Date Tue, 28 Nov 2017 17:17:46 GMT
This is an automated email from the ASF dual-hosted git repository.

echauchot pushed a commit to branch asf-site
in repository https://gitbox.apache.org/repos/asf/beam-site.git


The following commit(s) were added to refs/heads/asf-site by this push:
     new 7138441  Fix bad website regeneration
     new f4d0faa  This closes #355
7138441 is described below

commit 7138441f69c8a9484952b6bff13991a457f06c1a
Author: Etienne Chauchot <echauchot@apache.org>
AuthorDate: Tue Nov 28 17:20:18 2017 +0100

    Fix bad website regeneration
---
 content/documentation/sdks/java/nexmark/index.html | 804 +++++++++++++++++++++
 1 file changed, 804 insertions(+)

diff --git a/content/documentation/sdks/java/nexmark/index.html b/content/documentation/sdks/java/nexmark/index.html
new file mode 100644
index 0000000..a1d5a00
--- /dev/null
+++ b/content/documentation/sdks/java/nexmark/index.html
@@ -0,0 +1,804 @@
+<!DOCTYPE html>
+<html lang="en">
+  <head>
+  <meta charset="utf-8">
+  <meta http-equiv="X-UA-Compatible" content="IE=edge">
+  <meta name="viewport" content="width=device-width, initial-scale=1">
+  <title>Nexmark benchmark suite</title>
+  <meta name="description" content="Apache Beam is an open source, unified model and set
of language-specific SDKs for defining and executing data processing workflows, and also data
ingestion and integration flows, supporting Enterprise Integration Patterns (EIPs) and Domain
Specific Languages (DSLs). Dataflow pipelines simplify the mechanics of large-scale batch
and streaming data processing and can run on a number of runtimes like Apache Flink, Apache
Spark, and Google Cloud Dataflow  [...]
+">
+  <link href="https://fonts.googleapis.com/css?family=Roboto:100,300,400" rel="stylesheet">
+  <link rel="stylesheet" href="/css/site.css">
+  <script src="https://ajax.googleapis.com/ajax/libs/jquery/2.2.0/jquery.min.js"></script>
+  <script src="/js/bootstrap.min.js"></script>
+  <script src="/js/language-switch.js"></script>
+  <script src="/js/fix-menu.js"></script>
+  <script src="/js/section-nav.js"></script>
+  <script src="/js/page-nav.js"></script>
+  <link rel="canonical" href="https://beam.apache.org/documentation/sdks/java/nexmark/"
data-proofer-ignore>
+  <link rel="shortcut icon" type="image/x-icon" href="/images/favicon.ico">
+  <link rel="alternate" type="application/rss+xml" title="Apache Beam" href="https://beam.apache.org/feed.xml">
+  <script>
+    (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
+    (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
+    m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
+    })(window,document,'script','//www.google-analytics.com/analytics.js','ga');
+    ga('create', 'UA-73650088-1', 'auto');
+    ga('send', 'pageview');
+  </script>
+</head>
+
+  <body class="body" data-spy="scroll" data-target=".page-nav" data-offset="0">
+    <nav class="header navbar navbar-fixed-top">
+    <div class="navbar-header">
+      <button type="button" class="navbar-toggle" aria-expanded="false" aria-controls="navbar">
+        <span class="sr-only">Toggle navigation</span>
+        <span class="icon-bar"></span>
+        <span class="icon-bar"></span>
+        <span class="icon-bar"></span>
+      </button>
+
+      <a href="/" class="navbar-brand" >
+        <img alt="Brand" style="height: 25px" src="/images/beam_logo_navbar.png">
+      </a>
+    </div>
+
+    <div class="navbar-mask closed"></div>
+
+    <div id="navbar" class="navbar-container closed">
+      <ul class="nav navbar-nav">
+        <li>
+          <a href="/get-started/beam-overview/">Get Started</a>
+        </li>
+        <li>
+          <a href="/documentation/">Documentation</a>
+        </li>
+        <li>
+          <a href="/documentation/sdks/java/">SDKS</a>
+        </li>
+        <li>
+          <a href="/documentation/runners/capability-matrix/">RUNNERS</a>
+        </li>
+        <li>
+          <a href="/contribute/">Contribute</a>
+        </li>
+        <li><a href="/blog">Blog</a></li>
+      </ul>
+      <ul class="nav navbar-nav navbar-right">
+        <li class="dropdown">
+          <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-haspopup="true"
aria-expanded="false"><img src="https://www.apache.org/foundation/press/kit/feather_small.png"
alt="Apache Logo" style="height:20px;"><span class="caret"></span></a>
+          <ul class="dropdown-menu dropdown-menu-right">
+            <li><a href="http://www.apache.org/">ASF Homepage</a></li>
+            <li><a href="http://www.apache.org/licenses/">License</a></li>
+            <li><a href="http://www.apache.org/security/">Security</a></li>
+            <li><a href="http://www.apache.org/foundation/thanks.html">Thanks</a></li>
+            <li><a href="http://www.apache.org/foundation/sponsorship.html">Sponsorship</a></li>
+            <li><a href="https://www.apache.org/foundation/policies/conduct">Code
of Conduct</a></li>
+          </ul>
+        </li>
+      </ul>
+    </div>
+</nav>
+
+    <div class="clearfix container-main-content">
+      <div class="section-nav closed" data-offset-top="90" data-offset-bottom="500">
+        <span class="section-nav-back glyphicon glyphicon-menu-left"></span>
+        <nav>
+          <ul class="section-nav-list" data-section-nav>
+            <li><span class="section-nav-list-main-title">SDKS</span></li>
+<li><a href="/documentation/sdks/java/">Java SDK</a></li>
+<li><a href="/documentation/sdks/javadoc/2.1.0/" target="_blank">Java SDK API
Reference <img src="/images/external-link-icon.png"
+                                                                                        
                                          width="14" height="14"
+                                                                                        
                                                     alt="External link."></a>
+</li>
+<li><a href="/documentation/sdks/python/">Python SDK</a></li>
+<li><a href="/documentation/sdks/pydoc/2.1.0/" target="_blank">Python SDK API
Reference <img src="/images/external-link-icon.png"
+                                                                                        
                                          width="14" height="14"
+                                                                                        
                                                     alt="External link."></a>
+</li>
+<li>
+  <span class="section-nav-list-title">DSLs</span>
+
+  <ul class="section-nav-list">
+    <li><a href="/documentation/dsls/sql/">SQL</a></li>
+  </ul>
+</li>
+
+          </ul>
+        </nav>
+      </div>
+
+      <nav class="page-nav clearfix" data-offset-top="90" data-offset-bottom="500">
+        
+
+<ul class="nav">
+  <li><a href="#what-it-is">What it is</a></li>
+  <li><a href="#the-queries">The queries</a></li>
+  <li><a href="#benchmark-workload-configuration">Benchmark workload configuration</a>
+    <ul>
+      <li><a href="#events-generation-defaults">Events generation (defaults)</a></li>
+      <li><a href="#windows-defaults">Windows (defaults)</a></li>
+      <li><a href="#events-proportions-defaults">Events Proportions (defaults)</a></li>
+      <li><a href="#technical">Technical</a></li>
+    </ul>
+  </li>
+  <li><a href="#nexmark-output">Nexmark output</a></li>
+  <li><a href="#benchmark-launch-configuration">Benchmark launch configuration</a>
+    <ul>
+      <li><a href="#common-configuration-parameters">Common configuration parameters</a></li>
+      <li><a href="#available-suites">Available Suites</a></li>
+      <li><a href="#apex-runner-specific-configuration">Apex runner specific
configuration</a></li>
+      <li><a href="#google-cloud-dataflow-runner-specific-configuration">Google
Cloud Dataflow runner specific configuration</a></li>
+      <li><a href="#direct-runner-specific-configuration">Direct runner specific
configuration</a></li>
+      <li><a href="#flink-runner-specific-configuration">Flink runner specific
configuration</a></li>
+      <li><a href="#spark-runner-specific-configuration">Spark runner specific
configuration</a></li>
+    </ul>
+  </li>
+  <li><a href="#current-status">Current status</a>
+    <ul>
+      <li><a href="#batch--synthetic--local">Batch / Synthetic / Local</a></li>
+      <li><a href="#streaming--synthetic--local">Streaming / Synthetic / Local</a></li>
+      <li><a href="#batch--synthetic--cluster">Batch / Synthetic / Cluster</a></li>
+      <li><a href="#streaming--synthetic--cluster">Streaming / Synthetic / Cluster</a></li>
+    </ul>
+  </li>
+  <li><a href="#running-nexmark">Running Nexmark</a>
+    <ul>
+      <li><a href="#running-smoke-suite-on-the-directrunner-local">Running SMOKE
suite on the DirectRunner (local)</a></li>
+      <li><a href="#running-smoke-suite-on-the-sparkrunner-local">Running SMOKE
suite on the SparkRunner (local)</a></li>
+      <li><a href="#running-smoke-suite-on-the-flinkrunner-local">Running SMOKE
suite on the FlinkRunner (local)</a></li>
+      <li><a href="#running-smoke-suite-on-the-apexrunner-local">Running SMOKE
suite on the ApexRunner (local)</a></li>
+      <li><a href="#running-smoke-suite-on-google-cloud-dataflow">Running SMOKE
suite on Google Cloud Dataflow</a></li>
+      <li><a href="#running-query-0-on-a-spark-cluster-with-apache-hadoop-yarn">Running
query 0 on a Spark cluster with Apache Hadoop YARN</a></li>
+    </ul>
+  </li>
+</ul>
+
+
+      </nav>
+
+      <div class="body__contained body__section-nav">
+        <h1 id="nexmark-benchmark-suite">Nexmark benchmark suite</h1>
+
+<h2 id="what-it-is">What it is</h2>
+
+<p>Nexmark is a suite of pipelines inspired by the ‘continuous data stream’
+queries in the <a href="http://datalab.cs.pdx.edu/niagaraST/NEXMark/">Nexmark research
paper</a>.</p>
+
+<p>These are multiple queries over a three-entity model representing an online auction
system:</p>
+
+<ul>
+  <li><strong>Person</strong> represents a person submitting an item for
auction and/or making a bid
+ on an auction.</li>
+  <li><strong>Auction</strong> represents an item under auction.</li>
+  <li><strong>Bid</strong> represents a bid for an item under auction.</li>
+</ul>
+
+<h2 id="the-queries">The queries</h2>
+
+<p>The queries exercise many aspects of the Beam model:</p>
+
+<ul>
+  <li><strong>Query1</strong>: What are the bid values in Euros?
+Illustrates a simple map.</li>
+  <li><strong>Query2</strong>: What are the auctions with particular auction
numbers?
+Illustrates a simple filter.</li>
+  <li><strong>Query3</strong>: Who is selling in particular US states?
+Illustrates an incremental join (using per-key state and timer) and filter.</li>
+  <li><strong>Query4</strong>: What is the average selling price for each
auction
+category?
+Illustrates complex join (using custom window functions) and
+aggregation.</li>
+  <li><strong>Query5</strong>: Which auctions have seen the most bids in
the last period?
+Illustrates sliding windows and combiners.</li>
+  <li><strong>Query6</strong>: What is the average selling price per seller
for their
+last 10 closed auctions?
+Shares the same ‘winning bids’ core as for <strong>Query4</strong>, and
+illustrates a specialized combiner.</li>
+  <li><strong>Query7</strong>: What are the highest bids per period?
+Deliberately implemented using a side input to illustrate fanout.</li>
+  <li><strong>Query8</strong>: Who has entered the system and created an
auction in
+the last period?
+Illustrates a simple join.</li>
+</ul>
+
+<p>We have augmented the original queries with five more:</p>
+
+<ul>
+  <li><strong>Query0</strong>: Pass-through.
+Allows us to measure the monitoring overhead.</li>
+  <li><strong>Query9</strong>: Winning-bids.
+A common sub-query shared by <strong>Query4</strong> and <strong>Query6</strong>.</li>
+  <li><strong>Query10</strong>: Log all events to GCS files.
+Illustrates windows with large side effects on firing.</li>
+  <li><strong>Query11</strong>: How many bids did a user make in each session
they
+were active?
+Illustrates session windows.</li>
+  <li><strong>Query12</strong>: How many bids does a user make within a
fixed
+processing time limit?
+Illustrates working in processing time in the Global window, as
+compared with event time in non-Global windows for all the other
+queries.</li>
+</ul>
+
+<h2 id="benchmark-workload-configuration">Benchmark workload configuration</h2>
+<p>Here are some of the knobs of the benchmark workload (see <a href="https://github.com/apache/beam/blob/master/sdks/java/nexmark/src/main/java/org/apache/beam/sdk/nexmark/NexmarkConfiguration.java">NexmarkConfiguration.java</a>).</p>
+
+<p>These configuration items can be passed to the launch command line.</p>
+
+<h3 id="events-generation-defaults">Events generation (defaults)</h3>
+<ul>
+  <li>100 000 events generated</li>
+  <li>100 generator threads</li>
+  <li>Event rate in SIN curve</li>
+  <li>Initial event rate of 10 000</li>
+  <li>Event rate step of 10 000</li>
+  <li>100 concurrent auctions</li>
+  <li>1000 concurrent persons bidding / creating auctions</li>
+</ul>
+
+<h3 id="windows-defaults">Windows (defaults)</h3>
+<ul>
+  <li>size 10s</li>
+  <li>sliding period 5s</li>
+  <li>watermark hold for 0s</li>
+</ul>
+
+<h3 id="events-proportions-defaults">Events Proportions (defaults)</h3>
+<ul>
+  <li>Hot Auctions = ½</li>
+  <li>Hot Bidders = ¼</li>
+  <li>Hot Sellers = ¼</li>
+</ul>
+
+<h3 id="technical">Technical</h3>
+<ul>
+  <li>Artificial CPU load</li>
+  <li>Artificial IO load</li>
+</ul>
+
+<h2 id="nexmark-output">Nexmark output</h2>
+<p>Here is an example output of the Nexmark benchmark run in streaming mode with the
SMOKE suite on the (local) direct runner:</p>
+
+<pre>
+Performance:
+  Conf       Runtime(sec)         Events(/sec)         Results
+  0000                5,5              18138,9          100000
+  0001                4,2              23657,4           92000
+  0002                2,2              45683,0             351
+  0003                3,9              25348,5             444
+  0004                1,6               6207,3              40
+  0005                5,0              20173,5              12
+  0006                0,9              11376,6             401
+  0007              121,4                823,5               1
+  0008                2,5              40273,9            6000
+  0009                0,9              10695,2             298
+  0010                4,0              25025,0               1
+  0011                4,4              22655,2            1919
+  0012                3,5              28208,7            1919
+</pre>
+
+<h2 id="benchmark-launch-configuration">Benchmark launch configuration</h2>
+
+<p>We can specify the Beam runner to use with Maven profiles. The available profiles are:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>direct-runner
+spark-runner
+flink-runner
+apex-runner
+</code></pre>
+</div>
+
+<p>The runner must also be specified like in any other Beam pipeline using:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>--runner
+</code></pre>
+</div>
+
+<p>Test data is deterministically synthesized on demand. The test
+data may be synthesized in the same pipeline as the query itself,
+or may be published to Pub/Sub.</p>
+
+<p>The query results may be:</p>
+
+<ul>
+  <li>Published to Pub/Sub.</li>
+  <li>Written to text files as plain text.</li>
+  <li>Written to text files using an Avro encoding.</li>
+  <li>Sent to BigQuery.</li>
+  <li>Discarded.</li>
+</ul>
+
+<h3 id="common-configuration-parameters">Common configuration parameters</h3>
+
+<p>Decide if batch or streaming:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>--streaming=true
+</code></pre>
+</div>
+
+<p>Number of event generators:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>--numEventGenerators=4
+</code></pre>
+</div>
+
+<p>Run query N:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>--query=N
+</code></pre>
+</div>
+
+<h3 id="available-suites">Available Suites</h3>
+<p>The suite to run can be chosen using this configuration parameter:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>--suite=SUITE
+</code></pre>
+</div>
+
+<p>Available suites are:</p>
+<ul>
+  <li>DEFAULT: Test default configuration with query 0.</li>
+  <li>SMOKE: Run the 12 default configurations.</li>
+  <li>STRESS: Like SMOKE but for 1m events.</li>
+  <li>FULL_THROTTLE: Like SMOKE but for 100m events.</li>
+</ul>
+
+<h3 id="apex-runner-specific-configuration">Apex runner specific configuration</h3>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>--manageResources=false
--monitorJobs=false
+</code></pre>
+</div>
+
+<h3 id="google-cloud-dataflow-runner-specific-configuration">Google Cloud Dataflow
runner specific configuration</h3>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>--manageResources=false
--monitorJobs=true \
+--enforceEncodability=false --enforceImmutability=false \
+--project=&lt;your project&gt; \
+--zone=&lt;your zone&gt; \
+--workerMachineType=n1-highmem-8 \
+--stagingLocation=&lt;a gs path for staging&gt; \
+--runner=DataflowRunner \
+--tempLocation=gs://talend-imejia/nexmark/temp/ \
+--stagingLocation=gs://talend-imejia/nexmark/temp/staging/ \
+--filesToStage=target/beam-sdks-java-nexmark-2.1.0-SNAPSHOT.jar
+</code></pre>
+</div>
+
+<h3 id="direct-runner-specific-configuration">Direct runner specific configuration</h3>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>--manageResources=false
--monitorJobs=true \
+--enforceEncodability=false --enforceImmutability=false
+</code></pre>
+</div>
+
+<h3 id="flink-runner-specific-configuration">Flink runner specific configuration</h3>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>--manageResources=false
--monitorJobs=true \
+--flinkMaster=local --parallelism=#numcores
+</code></pre>
+</div>
+
+<h3 id="spark-runner-specific-configuration">Spark runner specific configuration</h3>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>--manageResources=false
--monitorJobs=true \
+--sparkMaster=local \
+-Dspark.ui.enabled=false -DSPARK_LOCAL_IP=localhost -Dsun.io.serialization.extendedDebugInfo=true
+</code></pre>
+</div>
+
+<h2 id="current-status">Current status</h2>
+
+<p>These tables contain the statuses of the query runs on the different runners. Google
Cloud Dataflow and Apache Gearpump statuses are yet to come.</p>
+
+<h3 id="batch--synthetic--local">Batch / Synthetic / Local</h3>
+
+<table class="table table-bordered">
+    <tr>
+      <th>Query</th>
+      <th>Direct</th>
+      <th>Spark</th>
+      <th>Flink</th>
+      <th>Apex</th>
+    </tr>
+    <tr>
+      <td>0</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>1</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>2</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>3</td>
+      <td>ok</td>
+      <td><a href="https://issues.apache.org/jira/browse/BEAM-1115">BEAM-1115</a></td>
+      <td>ok</td>
+      <td><a href="https://issues.apache.org/jira/browse/BEAM-1114">BEAM-1114</a></td>
+    </tr>
+    <tr>
+      <td>4</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>5</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>6</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>7</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>8</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>9</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>10</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>11</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>12</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+</table>
+
+<h3 id="streaming--synthetic--local">Streaming / Synthetic / Local</h3>
+
+<table class="table table-bordered">
+    <tr>
+      <th>Query</th>
+      <th>Direct</th>
+      <th>Spark <a href="https://issues.apache.org/jira/browse/BEAM-2847">BEAM-2847</a></th>
+      <th>Flink</th>
+      <th>Apex</th>
+    </tr>
+    <tr>
+      <td>0</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>1</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>2</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>3</td>
+      <td>ok</td>
+      <td><a href="https://issues.apache.org/jira/browse/BEAM-1035">BEAM-1035</a>,
<a href="https://issues.apache.org/jira/browse/BEAM-1115">BEAM-1115</a></td>
+      <td>ok</td>
+      <td><a href="https://issues.apache.org/jira/browse/BEAM-1114">BEAM-1114</a></td>
+    </tr>
+    <tr>
+      <td>4</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>5</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>6</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>7</td>
+      <td>ok</td>
+      <td><a href="https://issues.apache.org/jira/browse/BEAM-2112">BEAM-2112</a></td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>8</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>9</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>10</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>11</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+    <tr>
+      <td>12</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+      <td>ok</td>
+    </tr>
+</table>
+
+<h3 id="batch--synthetic--cluster">Batch / Synthetic / Cluster</h3>
+
+<p>Yet to come</p>
+
+<h3 id="streaming--synthetic--cluster">Streaming / Synthetic / Cluster</h3>
+
+<p>Yet to come</p>
+
+<h2 id="running-nexmark">Running Nexmark</h2>
+
+<h3 id="running-smoke-suite-on-the-directrunner-local">Running SMOKE suite on the DirectRunner
(local)</h3>
+
+<p>Batch Mode:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>mvn exec:java
-Dexec.mainClass=org.apache.beam.sdk.nexmark.Main -Pdirect-runner -Dexec.args="--runner=DirectRunner
--suite=SMOKE --streaming=false --manageResources=false --monitorJobs=true --enforceEncodability=true
--enforceImmutability=true"
+</code></pre>
+</div>
+
+<p>Streaming Mode:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>mvn exec:java
-Dexec.mainClass=org.apache.beam.sdk.nexmark.Main -Pdirect-runner -Dexec.args="--runner=DirectRunner
--suite=SMOKE --streaming=true --manageResources=false --monitorJobs=true --enforceEncodability=true
--enforceImmutability=true"
+</code></pre>
+</div>
+
+<h3 id="running-smoke-suite-on-the-sparkrunner-local">Running SMOKE suite on the SparkRunner
(local)</h3>
+
+<p>Batch Mode:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>mvn exec:java
-Dexec.mainClass=org.apache.beam.sdk.nexmark.Main -Pspark-runner "-Dexec.args=--runner=SparkRunner
--suite=SMOKE --streamTimeout=60 --streaming=false --manageResources=false --monitorJobs=true"
+</code></pre>
+</div>
+
+<p>Streaming Mode:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>mvn exec:java
-Dexec.mainClass=org.apache.beam.sdk.nexmark.Main -Pspark-runner "-Dexec.args=--runner=SparkRunner
--suite=SMOKE --streamTimeout=60 --streaming=true --manageResources=false --monitorJobs=true"
+</code></pre>
+</div>
+
+<h3 id="running-smoke-suite-on-the-flinkrunner-local">Running SMOKE suite on the FlinkRunner
(local)</h3>
+
+<p>Batch Mode:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>mvn exec:java
-Dexec.mainClass=org.apache.beam.sdk.nexmark.Main -Pflink-runner "-Dexec.args=--runner=FlinkRunner
--suite=SMOKE --streamTimeout=60 --streaming=false --manageResources=false --monitorJobs=true
 --flinkMaster=local"
+</code></pre>
+</div>
+
+<p>Streaming Mode:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>mvn exec:java
-Dexec.mainClass=org.apache.beam.sdk.nexmark.Main -Pflink-runner "-Dexec.args=--runner=FlinkRunner
--suite=SMOKE --streamTimeout=60 --streaming=true --manageResources=false --monitorJobs=true
 --flinkMaster=local"
+</code></pre>
+</div>
+
+<h3 id="running-smoke-suite-on-the-apexrunner-local">Running SMOKE suite on the ApexRunner
(local)</h3>
+
+<p>Batch Mode:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>mvn exec:java
-Dexec.mainClass=org.apache.beam.sdk.nexmark.Main -Papex-runner "-Dexec.args=--runner=ApexRunner
--suite=SMOKE --streamTimeout=60 --streaming=false --manageResources=false --monitorJobs=false"
+</code></pre>
+</div>
+
+<p>Streaming Mode:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>mvn exec:java
-Dexec.mainClass=org.apache.beam.sdk.nexmark.Main -Papex-runner "-Dexec.args=--runner=ApexRunner
--suite=SMOKE --streamTimeout=60 --streaming=true --manageResources=false --monitorJobs=false"
+</code></pre>
+</div>
+
+<h3 id="running-smoke-suite-on-google-cloud-dataflow">Running SMOKE suite on Google
Cloud Dataflow</h3>
+
+<p>Building package:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>mvn clean package
-Pdataflow-runner
+</code></pre>
+</div>
+
+<p>Submit to Google Dataflow service:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>java -cp sdks/java/nexmark/target/beam-sdks-java-nexmark-bundled-2.1.0-SNAPSHOT.jar
\
+  org.apache.beam.sdk.nexmark.Main \
+  --runner=DataflowRunner \
+  --project=&lt;your project&gt; \
+  --zone=&lt;your zone&gt; \
+  --workerMachineType=n1-highmem-8 \
+  --stagingLocation=&lt;a gs path for staging&gt; \
+  --streaming=true \
+  --sourceType=PUBSUB \
+  --pubSubMode=PUBLISH_ONLY \
+  --pubsubTopic=&lt;an existing Pubsub topic&gt; \
+  --resourceNameMode=VERBATIM \
+  --manageResources=false \
+  --monitorJobs=false \
+  --numEventGenerators=64 \
+  --numWorkers=16 \
+  --maxNumWorkers=16 \
+  --suite=SMOKE \
+  --firstEventRate=100000 \
+  --nextEventRate=100000 \
+  --ratePeriodSec=3600 \
+  --isRateLimited=true \
+  --avgPersonByteSize=500 \
+  --avgAuctionByteSize=500 \
+  --avgBidByteSize=500 \
+  --probDelayedEvent=0.000001 \
+  --occasionalDelaySec=3600 \
+  --numEvents=0 \
+  --useWallclockEventTime=true \
+  --usePubsubPublishTime=true \
+  --experiments=enable_custom_pubsub_sink
+</code></pre>
+</div>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>java -cp sdks/java/nexmark/target/beam-sdks-java-nexmark-bundled-2.1.0-SNAPSHOT.jar
\
+  org.apache.beam.sdk.nexmark.Main \
+  --runner=DataflowRunner \
+  --project=&lt;your project&gt; \
+  --zone=&lt;your zone&gt; \
+  --workerMachineType=n1-highmem-8 \
+  --stagingLocation=&lt;a gs path for staging&gt; \
+  --streaming=true \
+  --sourceType=PUBSUB \
+  --pubSubMode=SUBSCRIBE_ONLY \
+  --pubsubSubscription=&lt;an existing Pubsub subscription to above topic&gt; \
+  --resourceNameMode=VERBATIM \
+  --manageResources=false \
+  --monitorJobs=false \
+  --numWorkers=64 \
+  --maxNumWorkers=64 \
+  --suite=SMOKE \
+  --usePubsubPublishTime=true \
+  --outputPath=&lt;a gs path under which log files will be written&gt; \
+  --windowSizeSec=600 \
+  --occasionalDelaySec=3600 \
+  --maxLogEvents=10000 \
+  --experiments=enable_custom_pubsub_source
+</code></pre>
+</div>
+
+<h3 id="running-query-0-on-a-spark-cluster-with-apache-hadoop-yarn">Running query 0
on a Spark cluster with Apache Hadoop YARN</h3>
+
+<p>Building package:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>mvn clean package
-Pspark-runner
+</code></pre>
+</div>
+
+<p>Submit to the cluster:</p>
+
+<div class="highlighter-rouge"><pre class="highlight"><code>spark-submit
--master yarn-client --class org.apache.beam.sdk.nexmark.Main --driver-memory 512m --executor-memory
512m --executor-cores 1 beam-sdks-java-nexmark-bundled-2.1.0-SNAPSHOT.jar --runner=SparkRunner
--query=0 --streamTimeout=60 --streaming=false --manageResources=false --monitorJobs=true
+</code></pre>
+</div>
+
+      </div>
+    </div>
+    <footer class="footer">
+  <div class="footer__contained">
+    <div class="footer__cols">
+      <div class="footer__cols__col">
+        <div class="footer__cols__col__logo">
+          <img src="/images/beam_logo_circle.svg" class="footer__logo" alt="Beam logo">
+        </div>
+        <div class="footer__cols__col__logo">
+          <img src="/images/apache_logo_circle.svg" class="footer__logo" alt="Apache logo">
+        </div>
+      </div>
+      <div class="footer__cols__col footer__cols__col--md">
+        <div class="footer__cols__col__title">Start</div>
+        <div class="footer__cols__col__link"><a href="/get-started/beam-overview/">Overview</a></div>
+        <div class="footer__cols__col__link"><a href="/get-started/quickstart-java/">Quickstart
(Java)</a></div>
+        <div class="footer__cols__col__link"><a href="/get-started/quickstart-py/">Quickstart
(Python)</a></div>
+        <div class="footer__cols__col__link"><a href="/get-started/downloads/">Downloads</a></div>
+      </div>
+      <div class="footer__cols__col footer__cols__col--md">
+        <div class="footer__cols__col__title">Docs</div>
+        <div class="footer__cols__col__link"><a href="/documentation/programming-guide/">Concepts</a></div>
+        <div class="footer__cols__col__link"><a href="/documentation/pipelines/design-your-pipeline/">Pipelines</a></div>
+        <div class="footer__cols__col__link"><a href="/documentation/runners/capability-matrix/">Runners</a></div>
+      </div>
+      <div class="footer__cols__col footer__cols__col--md">
+        <div class="footer__cols__col__title">Community</div>
+        <div class="footer__cols__col__link"><a href="/contribute/">Contribute</a></div>
+        <div class="footer__cols__col__link"><a href="/contribute/team/">Team</a></div>
+        <div class="footer__cols__col__link"><a href="/contribute/presentation-materials/">Media</a></div>
+      </div>
+      <div class="footer__cols__col footer__cols__col--md">
+        <div class="footer__cols__col__title">Resources</div>
+        <div class="footer__cols__col__link"><a href="/blog/">Blog</a></div>
+        <div class="footer__cols__col__link"><a href="/get-started/support/">Support</a></div>
+        <div class="footer__cols__col__link"><a href="https://github.com/apache/beam">GitHub</a></div>
+      </div>
+    </div>
+  </div>
+  <div class="footer__bottom">
+    &copy;
+    <a href="http://www.apache.org">The Apache Software Foundation</a>
+    | <a href="/privacy_policy">Privacy Policy</a>
+    | <a href="/feed.xml">RSS Feed</a>
+    <br><br>
+    Apache Beam, Apache, Beam, the Beam logo, and the Apache feather logo are
+    either registered trademarks or trademarks of The Apache Software
+    Foundation. All other products or name brands are trademarks of their
+    respective holders, including The Apache Software Foundation.
+  </div>
+</footer>
+
+  </body>
+</html>

-- 
To stop receiving notification emails like this one, please contact
['"commits@beam.apache.org" <commits@beam.apache.org>'].

Mime
View raw message