Skip to content

Commit

Permalink
adding PartitionerBolt again
Browse files: browse the repository at this point in the history
  • Loading branch information
wowasa committed Apr 23, 2023
1 parent 5727105 commit 3d5971a
Show file tree
Hide file tree
Showing 2 changed files with 22 additions and 6 deletions.
14 changes: 11 additions & 3 deletions crawler-test.flux
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,9 @@ spouts:
 parallelism: 1

 bolts:
+- id: "partitioner"
+className: "com.digitalpebble.stormcrawler.bolt.URLPartitionerBolt"
+parallelism: 1
 - id: "fetcher"
 className: "eu.clarin.linkchecker.bolt.MetricsFetcherBolt"
 parallelism: 1
Expand All @@ -24,17 +27,22 @@ bolts:

 streams:
 - from: "spout"
-to: "fetcher"
+to: "partitioner"
 grouping:
 type: SHUFFLE
+- from: "partitioner"
+to: "fetcher"
+grouping:
+type: FIELDS
+args: ["key"]
 - from: "fetcher"
 to: "status"
 grouping:
 type: FIELDS
 args: ["url"]
 streamId: "status"
 - from: "fetcher"
-to: "fetcher"
+to: "partitioner"
 grouping:
 type: SHUFFLE
-streamId: "redirect"
+streamId: "redirect"
14 changes: 11 additions & 3 deletions crawler.flux
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,9 @@ spouts:
 parallelism: 1

 bolts:
+- id: "partitioner"
+className: "com.digitalpebble.stormcrawler.bolt.URLPartitionerBolt"
+parallelism: 1
 - id: "fetcher"
 className: "eu.clarin.linkchecker.bolt.MetricsFetcherBolt"
 parallelism: 1
Expand All @@ -24,17 +27,22 @@ bolts:

 streams:
 - from: "spout"
-to: "fetcher"
+to: "partitioner"
 grouping:
 type: SHUFFLE
+- from: "partitioner"
+to: "fetcher"
+grouping:
+type: FIELDS
+args: ["key"]
 - from: "fetcher"
 to: "status"
 grouping:
 type: FIELDS
 args: ["url"]
 streamId: "status"
 - from: "fetcher"
-to: "fetcher"
+to: "partitioner"
 grouping:
 type: SHUFFLE
-streamId: "redirect"
+streamId: "redirect"

0 comments on commit 3d5971a

Please sign in to comment.