Pig UDFs
# Java UDFs - LzoPigStorage
package xxxxx;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.InputFormat;
import org.apache.hadoop.mapreduce.OutputFormat;
import org.apache.hadoop.mapreduce.lib.output.TextOutputFormat;
import org.apache.pig.builtin.PigStorage;
import com.hadoop.mapreduce.LzoTextInputFormat;
/**
 * {@link PigStorage} variant that supplies {@link LzoTextInputFormat} as its
 * input format (presumably so that LZO-compressed text input can be loaded)
 * and {@link TextOutputFormat} as its output format.
 *
 * <p>Everything else, including field splitting, is inherited from
 * {@code PigStorage}. The delimiter is handed straight to the parent
 * constructor; this class keeps no state of its own.
 */
public class LzoPigStorage extends PigStorage {

    /** Creates an instance using the no-argument {@code PigStorage} constructor. */
    public LzoPigStorage() {
        super();
    }

    /**
     * Creates an instance with an explicit field delimiter.
     *
     * @param delimiter field delimiter, passed unchanged to {@code PigStorage}
     */
    public LzoPigStorage(String delimiter) {
        // No local copy of the delimiter is kept: nothing in this class reads it.
        super(delimiter);
    }

    /**
     * Returns the input format used when this function is used to load data.
     *
     * @return a new {@link LzoTextInputFormat}
     */
    @Override
    public InputFormat<LongWritable, Text> getInputFormat() {
        return new LzoTextInputFormat();
    }

    /**
     * Returns the output format used when this function is used to store data.
     *
     * <p>NOTE(review): this replaces whatever output format {@code PigStorage}
     * would provide with a plain {@link TextOutputFormat}. Presumably that means
     * stored tuples are rendered through {@code toString()} instead of being
     * joined with the configured delimiter, and the output is not LZO-compressed
     * by this class - confirm before relying on this class for STORE.
     *
     * @return a new {@link TextOutputFormat}
     */
    @Override
    public OutputFormat getOutputFormat() {
        return new TextOutputFormat();
    }
}
// Usage (Pig Latin script)
-- Register the jar that contains the compiled LzoPigStorage class
-- (파일명 is a placeholder for the jar's file name).
register 파일명.jar;
-- Refer to the loader by its fully qualified name; the qualifier has to match
-- the Java class's package declaration (xxxxx). '\t' is the field delimiter
-- passed to the LzoPigStorage(String) constructor; replace (.....) with the schema.
A = load 'data_path' using xxxxx.LzoPigStorage('\t') AS (.....);