java监控目录实时上传HDFS

背景描述:

需要对Linux服务器上特定目录中的非结构化文件进行实时监控,并在文件发生变化时将其上传到HDFS。

使用的方法

使用Apache Commons IO提供的文件监控组件(FileAlterationMonitor、FileAlterationObserver)来实现文件的监控功能

所需要的pom

xml 复制代码
<!-- Maven dependencies for the directory-monitor / HDFS-upload example. -->
<dependencies>
        <!-- Hadoop client; presumably supplies the FileSystem/Configuration/Path classes used by the upload code. -->
        <dependency>
            <groupId>org.apache.hadoop</groupId>
            <artifactId>hadoop-client</artifactId>
            <version>3.0.0</version>
        </dependency>
        <!-- NOTE(review): hadoop-client normally pulls in hadoop-common transitively; confirm this explicit entry is needed. -->
        <dependency>
            <groupId>org.apache.hadoop</groupId>
            <artifactId>hadoop-common</artifactId>
            <version>3.0.0</version>
        </dependency>
        <!-- Commons IO: provides the org.apache.commons.io.monitor classes imported by the monitor and listener. -->
        <dependency>
            <groupId>commons-io</groupId>
            <artifactId>commons-io</artifactId>
            <version>2.6</version>
        </dependency>
        <!-- NOTE(review): commons-lang3 is not referenced by the code shown in this article; verify it is required. -->
        <dependency>
            <groupId>org.apache.commons</groupId>
            <artifactId>commons-lang3</artifactId>
            <version>3.9</version>
        </dependency>
        <!-- NOTE(review): jsr305 is not referenced by the code shown in this article; verify it is required. -->
        <dependency>
            <groupId>com.google.code.findbugs</groupId>
            <artifactId>jsr305</artifactId>
            <version>1.3.9</version>
        </dependency>
        <!-- NOTE(review): no Lombok annotations are visible in the decompiled sources; presumably used in the original source. -->
        <dependency>
            <groupId>org.projectlombok</groupId>
            <artifactId>lombok</artifactId>
            <version>1.18.4</version>
        </dependency>
        <!-- NOTE(review): old fastjson 1.x release declared alongside fastjson2; neither is referenced by the code shown.
             Check security advisories for this version and whether both artifacts are really needed. -->
        <dependency>
            <groupId>com.alibaba</groupId>
            <artifactId>fastjson</artifactId>
            <version>1.2.28</version>
            <scope>compile</scope>
        </dependency>
        <dependency>
            <groupId>com.alibaba.fastjson2</groupId>
            <artifactId>fastjson2</artifactId>
            <version>2.0.26</version>
        </dependency>
        <!-- https://mvnrepository.com/artifact/cn.hutool/hutool-all -->
        <!-- Hutool; presumably the source of the StaticLog helper used by copyFile2HDFS (verify). -->
        <dependency>
            <groupId>cn.hutool</groupId>
            <artifactId>hutool-all</artifactId>
            <version>5.8.22</version>
        </dependency>

    </dependencies>
FileUtil.java(工具方法:上传文件到HDFS、根据文件类型生成HDFS目标路径)
java 复制代码
/**
 * Uploads a local file to HDFS, replacing whatever already exists at the destination.
 *
 * <p>Any existing destination is deleted recursively before the copy. Failures are
 * logged and not rethrown, so callers cannot tell from this method whether the upload
 * succeeded.
 *
 * @param hdfsURI  URI handed to {@code FileSystem.get}
 * @param username user name handed to {@code FileSystem.get}
 * @param srcPath  path of the local file to upload
 * @param newPath  destination path on HDFS
 */
public static void copyFile2HDFS(URI hdfsURI, String username, String srcPath, String newPath) {
        try {
            Configuration conf = new Configuration();
            // try-with-resources closes the FileSystem even when one of the calls below throws;
            // the previous explicit close() was skipped on any failure.
            try (FileSystem fs = FileSystem.get(hdfsURI, conf, username)) {
                Path src = new Path(srcPath);
                Path dst = new Path(newPath);
                if (fs.exists(dst)) {
                    fs.delete(dst, true);
                }
                fs.copyFromLocalFile(src, dst);
            }
            System.out.println("Upload Successfully!");
        } catch (Exception e) {
            // Log at error level and keep the throwable so the stack trace goes to the log
            // instead of stderr.
            StaticLog.error(e, "复制文件失败{}", e.getMessage());
        }
    }
java 复制代码
/**
 * Chooses the HDFS destination path for a file from its file-name extension.
 *
 * <p>The extension is the text after the last {@code '.'} in the file name, compared
 * case-insensitively. A name without any dot has no extension and goes to the default
 * directory.
 *
 * @param file the local file; only its name is used
 * @return the HDFS path: a type-specific directory under {@code /data/} followed by the
 *         file name, or {@code /data/<name>} when the extension is not recognised
 */
public static String getHDFSPath(File file) {
        String fileName = file.getName();
        int dotIndex = fileName.lastIndexOf('.');
        // Without this guard a dot-less name such as "mp4" would be treated as having the
        // extension "mp4", because substring(-1 + 1) returns the whole name.
        // Locale.ROOT keeps the lower-casing independent of the JVM default locale.
        String extension = dotIndex < 0
                ? ""
                : fileName.substring(dotIndex + 1).toLowerCase(java.util.Locale.ROOT);
        switch (extension) {
            case "mp4":
            case "avi":
            case "mov":
                return "/data/shipin/" + fileName;
            case "jpg":
            case "png":
                // NOTE(review): images are routed to "/data/txt/"; kept as-is, confirm this is intended.
                return "/data/txt/" + fileName;
            case "m4a":
            case "wav":
                return "/data/yuyin/" + fileName;
            case "txt":
                return "/data/wenjian/" + fileName;
            default:
                return "/data/" + fileName;
        }
    }
复制代码
FileMonitorTest.java
java 复制代码
//
// Source code recreated from a .class file by IntelliJ IDEA
// (powered by FernFlower decompiler)
//

package com.xxx.fileSync;

import java.util.concurrent.TimeUnit;
import org.apache.commons.io.filefilter.FileFilterUtils;
import org.apache.commons.io.filefilter.IOFileFilter;
import org.apache.commons.io.monitor.FileAlterationMonitor;
import org.apache.commons.io.monitor.FileAlterationObserver;

/**
 * Command-line entry point that watches a local directory with Commons IO and forwards
 * every detected change to a {@link FileListener}.
 */
public class FileMonitorTest {
    public FileMonitorTest() {
    }

    /**
     * Registers a {@link FileListener} on the watched directory and starts the monitor.
     *
     * @param args command-line arguments; not used
     * @throws Exception if the listener cannot be constructed or the monitor fails to start
     */
    public static void main(String[] args) throws Exception {
        String watchedDir = "/opt/xxxx";
        long pollIntervalMillis = TimeUnit.SECONDS.toMillis(5L);

        // Observe the directory without a file filter, so every file and sub-directory is
        // reported. An extra observer that was built with a ".success" suffix filter but
        // never registered has been dropped as dead code.
        FileAlterationObserver observer = new FileAlterationObserver(watchedDir);
        observer.addListener(new FileListener());

        FileAlterationMonitor monitor = new FileAlterationMonitor(pollIntervalMillis, observer);
        monitor.start();
    }
}
复制代码
FileListener.java重写方法
java 复制代码
//
// Source code recreated from a .class file by IntelliJ IDEA
// (powered by FernFlower decompiler)
//

package com.xxx.fileSync;

import java.io.File;
import java.io.IOException;
import java.net.URI;
import java.net.URISyntaxException;
import java.nio.file.Files;
import java.nio.file.StandardCopyOption;
import org.apache.commons.io.monitor.FileAlterationListenerAdaptor;
import org.apache.commons.io.monitor.FileAlterationObserver;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

public class FileListener extends FileAlterationListenerAdaptor {
    private static final Logger log = LoggerFactory.getLogger(FileListener.class);
    URI uri = new URI("hdfs://xxxxx:802xx0");
    String newPath = "";
    String newHDFSPath = "";
    String userName = "root";

    public FileListener() throws URISyntaxException {
    }

    public void onStart(FileAlterationObserver observer) {
        super.onStart(observer);
    }

    public void onDirectoryCreate(File directory) {
        this.newPath = "/data" + directory.getName();
        System.out.println("文件路径:" + directory.getAbsolutePath() + " 文件夹创建:" + directory.getName());
        FileUtil.newDir2HDFS(this.uri, this.userName, this.newPath);
        log.info("[Deleted Directory] : {}", directory.getAbsolutePath());
    }

    public void onDirectoryChange(File directory) {
        log.info("[Changed Directory] : {}", directory.getAbsolutePath());
    }

    public void onDirectoryDelete(File directory) {
        log.info("[Created Directory] : {}", directory.getAbsolutePath());
    }

    public void onFileCreate(File file) {
        try {
            log.info("[Created File] : {}", file.getAbsolutePath());
            this.newHDFSPath = FileUtil.getHDFSPath(file);
            this.newPath = FileUtil.getDestPath(file);
            System.out.println("监控源文件路径:" + file.toPath());
            System.out.println("监控源文件路径:" + file.getAbsolutePath() + " 目标HDFS文件创建:" + this.newHDFSPath);
            System.out.println("监控源文件路径:" + file.getAbsolutePath() + " 目标Linux文件创建:" + this.newPath);
            FileUtil.copyFile2HDFS(this.uri, this.userName, file.getAbsolutePath(), this.newHDFSPath);
            Files.copy(file.toPath(), (new File(this.newPath)).toPath(), StandardCopyOption.REPLACE_EXISTING);
        } catch (Throwable var3) {
            throw var3;
        }
    }

    public void onFileChange(File file) {
        try {
            log.info("[Amended File] : {}", file.getAbsolutePath());
            this.newPath = FileUtil.getDestPath(file);
            FileUtil.copyFile2HDFS(this.uri, this.userName, file.getAbsolutePath(), this.newPath);
            Files.copy(file.toPath(), (new File(this.newPath)).toPath(), StandardCopyOption.REPLACE_EXISTING);
        } catch (Throwable var3) {
            throw var3;
        }
    }

    public void onFileDelete(File file) {
        try {
            log.info("[Deleted File] : {}", file.getAbsolutePath());
            this.newHDFSPath = FileUtil.getHDFSPath(file);
            this.newPath = FileUtil.getDestPath(file);
            FileUtil.delFile2HDFS(this.uri, this.userName, this.newHDFSPath);
            Files.delete((new File(this.newPath)).toPath());
        } catch (Throwable var3) {
            throw var3;
        }
    }

    public void onStop(FileAlterationObserver observer) {
        super.onStop(observer);
    }
}
相关推荐
一 乐15 小时前
校园墙|校园社区|基于Java+vue的校园墙小程序系统(源码+数据库+文档)
java·前端·数据库·vue.js·spring boot·后端·小程序
TT哇15 小时前
【面经 每日一题】面试题16.25.LRU缓存(medium)
java·算法·缓存·面试
青云交15 小时前
Java 大视界 -- 基于 Java 的大数据联邦学习在跨行业数据协同创新中的实践突破
java·分布式计算·隐私保护·apache flink·大数据联邦学习·跨行业数据协同·安全通信
合作小小程序员小小店15 小时前
桌面开发,在线%考试管理%系统,基于eclipse,java,swing,mysql数据库。
java·数据库·mysql·eclipse·jdk
T.Ree.15 小时前
汇编_读写内存
开发语言·汇编·c#
oioihoii15 小时前
C/C++混合项目中的头文件管理:.h与.hpp的分工与协作
java·c语言·c++
一瓢一瓢的饮 alanchan15 小时前
Flink原理与实战(java版)#第2章 Flink的入门(第二节Flink简介)
java·大数据·flink·kafka·实时计算·离线计算·流批一体化计算
vx_bscxy32215 小时前
告别毕设焦虑!Python 爬虫 + Java 系统 + 数据大屏,含详细开发文档 基于微信小程序的民宿预约系统22398 (上万套实战教程,赠送源码)
java·spring boot·mysql·微信小程序·课程设计
kaikaile199515 小时前
基于MATLAB的直接序列扩频(DSSS)通信系统仿真实现
开发语言·matlab
czhc114007566315 小时前
C#1114 枚举
开发语言·c#