- Download dataset here
* Follow the well-commented code in kmeans.scala
* Follow the well-commented code in kmeans.scala
| # To execute script launch this command on shell: hbase shell HBaseRestore.rb | |
| include Java | |
| java_import org.apache.hadoop.hbase.HBaseConfiguration | |
| java_import org.apache.hadoop.hbase.client.HBaseAdmin | |
| java_import org.apache.hadoop.hbase.snapshot.ExportSnapshot | |
| java_import org.apache.hadoop.hbase.TableExistsException | |
| java_import org.apache.hadoop.util.ToolRunner |
| # Checking if the hbase.snapshot.enabled property in hbase-site.xml is set to true | |
| # To execute script launch this command on shell: hbase shell HBaseBackup.rb | |
| @clusterToSave = "hdfs:///srv2:8082/hbase" | |
| # CHECK THE PATH OF HBase lib | |
| @libjars = `ls /opt/cloudera/parcels/CDH-5.4.4-1.cdh5.4.4.p0.4/lib/hbase/*.jar | tr "\n" ","` | |
| @ignore = [ /zipkin\..*/i, /.*_temp/i, /.*tmp/i, /test_.*/i, /.*_test/i, /.*_old/i ] | |
| @mappers = "2" | |
| include Java |
* Download the JSON SerDe from:
* http://files.cloudera.com/samples/hive-serdes-1.0-SNAPSHOT.jar
* and rename it to hive-serdes-1.0.jar
Add the JAR to the HIVE_AUX_JARS_PATH of HiveServer2: