From 34feaded5fb173f9ac6ee9ddc9288dc265ba7cc1 Mon Sep 17 00:00:00 2001
From: Emmanuelveslin <41759142+Emmanuelveslin@users.noreply.github.com>
Date: Sun, 6 Oct 2019 00:15:00 +0530
Subject: [PATCH] serialization is done properly

---
Review note: the payload below was revised during review; the blob id on the
"index" line is the one from the original submission and was not recomputed.

 serialization.java | 28 ++++++++++++++++++++++++++++
 1 file changed, 28 insertions(+)
 create mode 100644 serialization.java

diff --git a/serialization.java b/serialization.java
new file mode 100644
index 00000000..54cfa90e
--- /dev/null
+++ b/serialization.java
@@ -0,0 +1,28 @@
+import org.apache.spark._
+import play.api.libs.json._
+import play.api.libs.functional.syntax._
+
+import scala.util.Try
+
+// Spark-shell style script: it expects a SparkContext named `sc` to be in scope already.
+
+/** One JSON record: a name plus a flag for whether that person loves pandas. */
+case class Person(name: String, lovesPandas: Boolean)
+
+// Macro-derived Play JSON codec for Person; it reads and writes, and as an implicit
+// it is available to Json.toJson below. The explicit type annotation keeps the
+// implicit's type from being left to inference.
+implicit val personReads: Format[Person] = Json.format[Person]
+
+val text = """{"name":"Sparky The Bear", "lovesPandas":true}"""
+
+val input = sc.parallelize(List(text))
+
+// Json.parse throws on malformed text. Wrapping it in Try drops such lines instead
+// of failing the whole job, the same way asOpt below drops records that parse as
+// JSON but do not match Person.
+val parsed = input.flatMap(line => Try(Json.parse(line)).toOption)
+val result = parsed.flatMap(record => personReads.reads(record).asOpt)
+
+// Keep only the panda lovers and save them as JSON text.
+result.filter(_.lovesPandas).map(Json.toJson(_)).saveAsTextFile("files/out/pandainfo.json")