Skip to main content

Posts

Showing posts from October, 2019

Apache Beam

First code in Apache Beam: a word count example. Word count .java file -> package com.test.training; import org.apache.beam.sdk.Pipeline; import org.apache.beam.sdk.io.TextIO; import org.apache.beam.sdk.options.PipelineOptions; import org.apache.beam.sdk.options.PipelineOptionsFactory; import org.apache.beam.sdk.transforms.Count; import org.apache.beam.sdk.transforms.DoFn; import org.apache.beam.sdk.transforms.Filter; import org.apache.beam.sdk.transforms.FlatMapElements; import org.apache.beam.sdk.transforms.MapElements; import org.apache.beam.sdk.transforms.ParDo; import org.apache.beam.sdk.values.KV; import org.apache.beam.sdk.values.PCollection; import org.apache.beam.sdk.values.TypeDescriptors; public class BasicWordCountWithExplaination { public static void main(String[] args) { // Create a PipelineOptions object. This object lets us set various execution     // options for our pipeline, such as the runner you wish to us