I hereby claim:
- I am ewhauser on github.
- I am ewhauser (https://keybase.io/ewhauser) on keybase.
- I have a public key ASDgt9UmpXcLznvoNPS0LsfUbzCUQPcbaceAg8QC2CAZlgo
To claim this, I am signing this object:
I hereby claim:
To claim this, I am signing this object:
These notes are from Facebook's Analytics @ Scale conference. I didn't take notes from the presentation or discussions with developers, so feel free to correct any inconsistencies: | |
- Presto is an ANSI SQL engine built on top of HDFS | |
- Similar functionality to Cloudera's Impala | |
- Facebook started developing this project prior to the Impala announcement; some design choices differ | |
- Implemented in Java | |
- Queries execute around 10x faster than Hive; aggregation-based queries can be 100x faster | |
- Byte code generation is used for efficient predicate processing | |
- Efficient fixed memory data structures are used (very low GC overhead) | |
- Presto daemons do not have to run on data nodes |
#!/usr/bin/env ruby | |
require 'rubygems' | |
require 'getoptlong' | |
require 'socket' | |
require 'json' | |
require 'timeout' | |
require 'open-uri' | |
host = "localhost" |
package org.apache.flume.kafka; | |
import com.cloudera.flume.core.Event; | |
import com.cloudera.flume.core.EventImpl; | |
import com.cloudera.util.Clock; | |
import kafka.api.FetchRequest; | |
import kafka.javaapi.consumer.SimpleConsumer; | |
import kafka.message.Message; | |
import kafka.server.KafkaConfig; | |
import kafka.server.KafkaServer; |
package com.exacttarget.bloomin.jedis; | |
import com.google.common.base.Preconditions; | |
import com.twitter.common.net.pool.Connection; | |
import redis.clients.jedis.Jedis; | |
public class JedisConnection implements Connection<Jedis, Jedis> { | |
private final Jedis jedis; |
# Use csshX to open terminals on the nodes found in a search.
#
# Usage:
#   knife exec csshx.rb 'role:the_role'
#
# The search term is read from ARGV[2] (going by the usage line above, the
# third word after `knife`). Each node returned by the search contributes its
# fqdn as one host argument to csshX.

query = ARGV[2]
abort("usage: knife exec csshx SEARCH_TERM") unless query

# Collect the fqdn of every matching node, dropping nil/blank values so csshX
# is never handed an empty host argument.
nodes = search(:node, query.to_s).collect { |n| n.fqdn.to_s }.reject { |fqdn| fqdn.empty? }

# Pass each host as its own argument: the multi-argument form of exec does not
# go through a shell, so characters in a hostname are never shell-interpreted.
# exec replaces the current process, so nothing below runs once it succeeds.
exec('csshX', *nodes) unless nodes.empty?

# Reached only when the search produced no usable hosts.
exit 0