Details
-
Bug
-
Status: Closed
-
Critical
-
Resolution: Not A Problem
-
None
-
None
-
None
Description
Using the dockerised version of Zeppelin:
docker run -p 8080:8080 --rm --name zeppelin apache/zeppelin:0.9.0
import spark.implicits._
import org.apache.spark.SparkContext
import org.apache.spark.sql.SQLContext
import com.databricks.spark.xml._

val sitemapRoot = "s3a://music-dev/sitemap"
sc.hadoopConfiguration.set("fs.s3a.access.key", "***");
sc.hadoopConfiguration.set("fs.s3a.secret.key", "***");
val sqlcontext = new SQLContext(sc)
sqlcontext.read.format("com.databricks.spark.xml")
  .option("rowTag", "url")
  .load(s"$sitemapRoot/song*")
  .createOrReplaceTempView("existingSongData")
Dependencies:
com.databricks:spark-xml_2.11:0.9.0
org.apache.hadoop:hadoop-aws:2.7.6
Stack trace:
java.lang.NoClassDefFoundError: Could not initialize class org.apache.spark.rdd.RDDOperationScope$
  at org.apache.spark.SparkContext.withScope(SparkContext.scala:699)
  at org.apache.spark.SparkContext.newAPIHadoopFile(SparkContext.scala:1146)
  at com.databricks.spark.xml.util.XmlFile$.withCharset(XmlFile.scala:46)
  at com.databricks.spark.xml.DefaultSource$$anonfun$createRelation$1.apply(DefaultSource.scala:71)
  at com.databricks.spark.xml.DefaultSource$$anonfun$createRelation$1.apply(DefaultSource.scala:71)
  at com.databricks.spark.xml.XmlRelation$$anonfun$1.apply(XmlRelation.scala:43)
  at com.databricks.spark.xml.XmlRelation$$anonfun$1.apply(XmlRelation.scala:42)
  at scala.Option.getOrElse(Option.scala:121)
  at com.databricks.spark.xml.XmlRelation.<init>(XmlRelation.scala:41)
  at com.databricks.spark.xml.XmlRelation$.apply(XmlRelation.scala:29)
  at com.databricks.spark.xml.DefaultSource.createRelation(DefaultSource.scala:74)
  at com.databricks.spark.xml.DefaultSource.createRelation(DefaultSource.scala:52)
  at org.apache.spark.sql.execution.datasources.DataSource.resolveRelation(DataSource.scala:318)
  at org.apache.spark.sql.DataFrameReader.loadV1Source(DataFrameReader.scala:223)
  at org.apache.spark.sql.DataFrameReader.load(DataFrameReader.scala:211)
  at org.apache.spark.sql.DataFrameReader.load(DataFrameReader.scala:178)
  ... 45 elided