This repository has been archived by the owner on Aug 11, 2023. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathFSMSample.scala
84 lines (77 loc) · 2.53 KB
/
FSMSample.scala
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
package com.examples.spark
import cats.Id
import cats.effect.{ExitCode, IO, IOApp}
import trembita._
import trembita.spark._
import cats.syntax.all._
import cats.effect.Console.io._
import trembita.fsm._
import org.apache.spark.sql.{Encoder, Encoders, SparkSession}
import trembita.collections._
import scala.concurrent.duration._
/**
  * Sample application that runs a keyed finite-state machine (FSM) over a
  * Spark-backed trembita pipeline and prints the elements it produces.
  *
  * To run this example you need a Spark cluster reachable at
  * `spark://spark-master:7077`. Use docker-compose to deploy one.
  *
  * @see resources/spark/cluster
  */
object FSMSample extends IOApp {

  /** States of the sample door FSM. */
  sealed trait DoorState extends Serializable
  case object Opened extends DoorState
  case object Closed extends DoorState

  /** Kryo-based Spark encoder for [[DoorState]]. */
  implicit val doorStateEncoder: Encoder[DoorState] = Encoders.kryo[DoorState]

  /** Kryo-based Spark encoder for the FSM data: one `Int` per [[DoorState]]. */
  implicit val stateEncoder: Encoder[Map[DoorState, Int]] =
    Encoders.kryo[Map[DoorState, Int]]

  /**
    * Builds a pipeline of 5000 pseudo-random integers, runs it through the door
    * FSM keyed by `_ % 4`, adds 1 to every resulting element and prints the
    * collected array formatted as `[a, b, ...]`.
    *
    * @param spark session whose `sparkContext` is used to create the input RDD
    * @return an `IO` that evaluates the pipeline and prints its output
    */
  def sparkSample(implicit spark: SparkSession): IO[Unit] = {
    import spark.implicits._
    implicit val timeout: AsyncTimeout = AsyncTimeout(5.minutes)

    // `Random.nextInt()` spans the whole Int range, so the inputs (and therefore
    // the `_ % 4` keys below) may be negative.
    val pipeline: DataPipeline[Int, Spark] =
      Input.rdd.create(
        spark.sparkContext.parallelize(
          List.tabulate(5000)(i => scala.util.Random.nextInt() + i)
        )
      )

    val withDoorState =
      pipeline
        .fsmByKey[Int, DoorState, Map[DoorState, Int], Int](getKey = _ % 4)(
          initial = InitialState.pure(FSM.State(Opened, Map.empty))
        )(_.when(Opened) {
          // Multiples of 4 must be tested before the general even case: every
          // multiple of 4 is also even and cases are tried top to bottom, so in
          // the opposite order this branch could never be selected.
          case i if i % 4 == 0 => _.stay push (i * 2)
          case i if i % 2 == 0 =>
            _.goto(Closed)
              .modify(_.modify(Opened, default = 1)(_ + 1))
              .push(_.apply(Opened) + i)
        }.when(Closed) {
            case i if i % 3 == 0 =>
              _.goto(Opened)
                .modify(_.modify(Closed, default = 1)(_ + 1)) spam (_.apply(
                Closed
              ) to 10)
            case i if i % 2 == 0 =>
              _.stay.push(_.values.sum)
          }
          .whenUndefined { i =>
            {
              // Inputs matched by none of the `when` cases above: log the value,
              // then go to Closed with an empty map and push nothing.
              println(s"Producing nothing..! [#$i]")
              _.goto(Closed).change(Map.empty).dontPush
            }
          })
        .mapK(idTo[IO])
        .map(_ + 1)

    withDoorState
      .into(Output.array)
      .run
      .flatMap(s => putStrLn(s.mkString("[", ", ", "]")))
  }

  /**
    * Entry point: obtains a `SparkSession` for master `spark://spark-master:7077`,
    * runs [[sparkSample]] with it and stops the session in the bracket's release
    * step.
    *
    * @param args command-line arguments (not used)
    * @return `ExitCode.Success` once the sample has completed
    */
  def run(args: List[String]): IO[ExitCode] =
    IO(
      SparkSession
        .builder()
        .master("spark://spark-master:7077")
        .appName("trembita-spark")
        .getOrCreate()
    ).bracket(use = { implicit spark: SparkSession =>
        sparkSample
      })(release = spark => IO { spark.stop() })
      .as(ExitCode.Success)
}