{"id":1952,"date":"2020-08-18T11:52:32","date_gmt":"2020-08-18T15:52:32","guid":{"rendered":"http:\/\/sys4seq.com\/?p=1952"},"modified":"2022-06-08T11:31:03","modified_gmt":"2022-06-08T15:31:03","slug":"building-a-real-time-big-data-pipeline-6-spark-core-hadoop-sbt","status":"publish","type":"post","link":"https:\/\/sys4seq.com\/index.php\/2020\/08\/18\/building-a-real-time-big-data-pipeline-6-spark-core-hadoop-sbt\/","title":{"rendered":"Building a real-time big data pipeline 6: Spark Core, Hadoop, SBT"},"content":{"rendered":"<p>Apache Spark\u00a0<sup id=\"fnref:1\" role=\"doc-noteref\"><\/sup>is an open-source cluster computing system that provides high-level APIs in Java, Scala, Python and R. Spark is also packaged with higher-level libraries for SQL, machine learning (MLlib), streaming, and graphs (GraphX).<\/p>\n<p><a href=\"https:\/\/adinasarapu.github.io\/posts\/2020\/08\/blog-post-spark-sbt\/\" target=\"_blank\" rel=\"noopener\">&gt;&gt;&gt;<\/a><\/p>\n<p>&nbsp;<\/p>\n","protected":false},"excerpt":{"rendered":"Apache Spark\u00a0is an open-source cluster computing system that provides high-level APIs in Java, Scala, Python and R. Spark is also packaged with higher-level libraries for SQL, machine learning (MLlib), streaming, and graphs (GraphX). \n&gt;&gt;&gt; &nbsp;","protected":false},"author":1,"featured_media":0,"comment_status":"closed","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"_mi_skip_tracking":false,"_monsterinsights_sitenote_active":false,"_monsterinsights_sitenote_note":"","_monsterinsights_sitenote_category":0},"categories":[44,43],"tags":[49,55,54],"_links":{"self":[{"href":"https:\/\/sys4seq.com\/index.php\/wp-json\/wp\/v2\/posts\/1952"}],"collection":[{"href":"https:\/\/sys4seq.com\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/sys4seq.com\/index.php\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/sys4seq.com\/index.php\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/sys4seq.com\/index.php\/wp-json\/wp\/v2\/comments?post=1952"}],"version-history":[{"count":9,"href":"https:\/\/sys4seq.com\/index.php\/wp-json\/wp\/v2\/posts\/1952\/revisions"}],"predecessor-version":[{"id":1963,"href":"https:\/\/sys4seq.com\/index.php\/wp-json\/wp\/v2\/posts\/1952\/revisions\/1963"}],"wp:attachment":[{"href":"https:\/\/sys4seq.com\/index.php\/wp-json\/wp\/v2\/media?parent=1952"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/sys4seq.com\/index.php\/wp-json\/wp\/v2\/categories?post=1952"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/sys4seq.com\/index.php\/wp-json\/wp\/v2\/tags?post=1952"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}