HDFS文件的tail
2013-12-05 18:00
190 查看
package com.xxx.hdfstail;
import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStreamReader;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IOUtils;
/**
 * Follows a single HDFS file in the manner of {@code tail -f}.
 *
 * <p>The file is re-opened every few seconds, everything from the last
 * remembered byte offset to the current end of the stream is printed line
 * by line to standard output, and the new end position is remembered for
 * the next poll. Polling stops when the thread is interrupted.
 */
public class HDFSTailByLine_V4 {
    /** File that is tailed when no path is given on the command line. */
    private static final String DEFAULT_SRC =
            "hdfs://192.168.1.132:9000/user/hive/warehouse/log_asjh/ASJH_2013-12-05/ASJH_2013-12-05_00000";

    /** Pause between two polls of the file, in milliseconds. */
    private static final long POLL_INTERVAL_MS = 3000L;

    String src;
    Path path = null;
    Configuration conf;
    FileSystem srcFs;

    /**
     * Resolves the file system that owns {@code src}.
     *
     * @param src URI or path of the file to tail
     * @throws IllegalStateException if the file system cannot be obtained;
     *         the underlying {@link IOException} is kept as the cause
     */
    public HDFSTailByLine_V4(String src) {
        this.src = src;
        path = new Path(src);
        conf = new Configuration();
        try {
            srcFs = path.getFileSystem(conf);
        } catch (IOException e) {
            // Fail here instead of leaving srcFs null, which would only
            // surface later as a NullPointerException inside tail().
            throw new IllegalStateException(
                    "Cannot obtain file system for " + src, e);
        }
    }

    /**
     * Prints the file from its beginning and then keeps printing whatever
     * is appended, polling every {@link #POLL_INTERVAL_MS} milliseconds
     * until the current thread is interrupted.
     *
     * @throws IOException if the path is a directory or the file cannot be
     *         stat'ed, opened or read
     */
    private void tail() throws IOException {
        if (srcFs.isDirectory(path)) {
            throw new IOException("Source must be a file.");
        }
        // Start at the beginning of the file, so the first pass prints
        // every line that already exists.
        long offset = 0;
        while (true) {
            // Re-read the length on every poll so the diagnostic line shows
            // the current reported size rather than the size at start-up.
            long fileSize = srcFs.getFileStatus(path).getLen();
            System.out.println(fileSize + " " + offset);
            offset = printFrom(offset);
            System.out.println("=========");
            try {
                Thread.sleep(POLL_INTERVAL_MS);
            } catch (InterruptedException e) {
                // Keep the interrupt visible to whoever runs this thread.
                Thread.currentThread().interrupt();
                break;
            }
            System.out.println("sleep 3 s !");
        }
    }

    /**
     * Opens the file, prints every line found from {@code offset} to the
     * end of the stream, and closes the file again even when reading fails.
     *
     * <p>NOTE(review): bytes are decoded with the platform default charset;
     * pass an explicit charset to {@code InputStreamReader} once the
     * encoding of the tailed file is known.
     *
     * <p>NOTE(review): a last line that is not yet terminated by a newline
     * is printed as it is; if the writer later completes it, the remainder
     * shows up as a separate line on the next poll.
     *
     * @param offset byte position at which reading starts
     * @return the stream position after the reader has been drained, to be
     *         used as the starting offset of the next poll
     * @throws IOException if the file cannot be opened, positioned or read
     */
    private long printFrom(long offset) throws IOException {
        FSDataInputStream in = srcFs.open(path);
        try {
            in.seek(offset);
            BufferedReader reader = new BufferedReader(
                    new InputStreamReader(in));
            String line;
            while ((line = reader.readLine()) != null) {
                System.out.println(line);
                System.out.println("===+++++===");
            }
            // The reader was drained until end of stream, so the underlying
            // position marks the end of everything consumed in this poll.
            return in.getPos();
        } finally {
            // The reader only wraps this stream; closing the stream
            // releases the resource on both the normal and the error path.
            in.close();
        }
    }

    /**
     * Tails the file named by the first command-line argument, or the
     * built-in default file when no argument is given.
     *
     * @param args optional: {@code args[0]} is the path of the file to tail
     * @throws Exception if the file cannot be tailed
     */
    public static void main(String[] args) throws Exception {
        String src = args.length > 0 ? args[0] : DEFAULT_SRC;
        HDFSTailByLine_V4 t = new HDFSTailByLine_V4(src);
        t.tail();
    }
}
import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStreamReader;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IOUtils;
/**
 * Follows a single HDFS file in the manner of {@code tail -f}.
 *
 * <p>The file is re-opened every few seconds, everything from the last
 * remembered byte offset to the current end of the stream is printed line
 * by line to standard output, and the new end position is remembered for
 * the next poll. Polling stops when the thread is interrupted.
 */
public class HDFSTailByLine_V4 {
    /** File that is tailed when no path is given on the command line. */
    private static final String DEFAULT_SRC =
            "hdfs://192.168.1.132:9000/user/hive/warehouse/log_asjh/ASJH_2013-12-05/ASJH_2013-12-05_00000";

    /** Pause between two polls of the file, in milliseconds. */
    private static final long POLL_INTERVAL_MS = 3000L;

    String src;
    Path path = null;
    Configuration conf;
    FileSystem srcFs;

    /**
     * Resolves the file system that owns {@code src}.
     *
     * @param src URI or path of the file to tail
     * @throws IllegalStateException if the file system cannot be obtained;
     *         the underlying {@link IOException} is kept as the cause
     */
    public HDFSTailByLine_V4(String src) {
        this.src = src;
        path = new Path(src);
        conf = new Configuration();
        try {
            srcFs = path.getFileSystem(conf);
        } catch (IOException e) {
            // Fail here instead of leaving srcFs null, which would only
            // surface later as a NullPointerException inside tail().
            throw new IllegalStateException(
                    "Cannot obtain file system for " + src, e);
        }
    }

    /**
     * Prints the file from its beginning and then keeps printing whatever
     * is appended, polling every {@link #POLL_INTERVAL_MS} milliseconds
     * until the current thread is interrupted.
     *
     * @throws IOException if the path is a directory or the file cannot be
     *         stat'ed, opened or read
     */
    private void tail() throws IOException {
        if (srcFs.isDirectory(path)) {
            throw new IOException("Source must be a file.");
        }
        // Start at the beginning of the file, so the first pass prints
        // every line that already exists.
        long offset = 0;
        while (true) {
            // Re-read the length on every poll so the diagnostic line shows
            // the current reported size rather than the size at start-up.
            long fileSize = srcFs.getFileStatus(path).getLen();
            System.out.println(fileSize + " " + offset);
            offset = printFrom(offset);
            System.out.println("=========");
            try {
                Thread.sleep(POLL_INTERVAL_MS);
            } catch (InterruptedException e) {
                // Keep the interrupt visible to whoever runs this thread.
                Thread.currentThread().interrupt();
                break;
            }
            System.out.println("sleep 3 s !");
        }
    }

    /**
     * Opens the file, prints every line found from {@code offset} to the
     * end of the stream, and closes the file again even when reading fails.
     *
     * <p>NOTE(review): bytes are decoded with the platform default charset;
     * pass an explicit charset to {@code InputStreamReader} once the
     * encoding of the tailed file is known.
     *
     * <p>NOTE(review): a last line that is not yet terminated by a newline
     * is printed as it is; if the writer later completes it, the remainder
     * shows up as a separate line on the next poll.
     *
     * @param offset byte position at which reading starts
     * @return the stream position after the reader has been drained, to be
     *         used as the starting offset of the next poll
     * @throws IOException if the file cannot be opened, positioned or read
     */
    private long printFrom(long offset) throws IOException {
        FSDataInputStream in = srcFs.open(path);
        try {
            in.seek(offset);
            BufferedReader reader = new BufferedReader(
                    new InputStreamReader(in));
            String line;
            while ((line = reader.readLine()) != null) {
                System.out.println(line);
                System.out.println("===+++++===");
            }
            // The reader was drained until end of stream, so the underlying
            // position marks the end of everything consumed in this poll.
            return in.getPos();
        } finally {
            // The reader only wraps this stream; closing the stream
            // releases the resource on both the normal and the error path.
            in.close();
        }
    }

    /**
     * Tails the file named by the first command-line argument, or the
     * built-in default file when no argument is given.
     *
     * @param args optional: {@code args[0]} is the path of the file to tail
     * @throws Exception if the file cannot be tailed
     */
    public static void main(String[] args) throws Exception {
        String src = args.length > 0 ? args[0] : DEFAULT_SRC;
        HDFSTailByLine_V4 t = new HDFSTailByLine_V4(src);
        t.tail();
    }
}
相关文章推荐
- 编写agent,执行tail命令将文件导入hdfs,并设置以时间为目录进行存放
- 02、创建RDD(集合、本地文件、HDFS文件)
- Spark中加载本地(或者hdfs)文件以及SparkContext实例的textFile使用
- hdfs判断文件是否存在
- HDFS 上传文件不均衡和Balancer太慢的问题
- shell遍历hdfs上的文件目录
- spark:学习过程中遇到的一些问题及解决方法(如何将本地文件发布到HDFS)--11
- [置顶] HDFS文件内容追加(Append)
- linux hadoop mount 加载HDFS到本地文件系统
- 使用Hadoop API操作HDFS文件时遇到的问题及解决总结
- HDFS文件系统内的文件格式转换(zip格式转化成gzip格式)
- HDFS读写文件流程
- 文件显示命令:cat、more、less、tail、touch详解
- flink使用BucketingSink将文件写入hdfs
- linux学习笔记-第四课-cp,mkdir,rm,mv,cat,tac,tail,head,文件属性,权限
- java实现-hdfs上的文件上传下载(windows)
- HDFS源码分析(一)-----INode文件节点
- HDFS之globStatus()函数(用通配符匹配制定模式的路径)liststatus() (列出目录下的所有文件)
- hdfs源码剖析文件写入过程时序图
- Java实现HDFS文件操作工具类