Flink UDTF 函数

代码示例:IP 解析 demo 案例

https://help.aliyun.com/zh/flink/developer-reference/udtfs

java 复制代码
package com.xxx.udx;


import com.alibaba.fastjson.JSON;
import com.alibaba.fastjson.JSONObject;
import com.maxmind.db.CHMCache;
import com.maxmind.geoip2.DatabaseReader;
import com.maxmind.geoip2.exception.GeoIp2Exception;
import com.maxmind.geoip2.model.CountryResponse;
import org.apache.flink.table.functions.FunctionContext;
import org.apache.flink.table.functions.TableFunction;
//import org.apache.flink.table.sources.parquet.update.UpdateVectorizedColumnRowInputParquetFormat;
import org.apache.flink.table.types.DataType;
//import org.apache.flink.table.types.DataTypes;
import org.apache.flink.types.Row;
import org.apache.http.HttpHost;
import org.apache.http.client.config.RequestConfig;
import org.apache.http.client.methods.CloseableHttpResponse;
import org.apache.http.client.methods.HttpGet;
import org.apache.http.conn.routing.HttpRoute;
import org.apache.http.impl.client.CloseableHttpClient;
import org.apache.http.impl.client.HttpClientBuilder;
import org.apache.http.impl.client.HttpClients;
import org.apache.http.impl.conn.PoolingHttpClientConnectionManager;
import org.apache.http.util.EntityUtils;

import java.io.IOException;
import java.io.InputStream;
import java.net.InetAddress;
import java.net.UnknownHostException;

/**
 * 使用节点ip解析服务
 */

public class GetResolveIp4Ip6AP extends TableFunction<Row> {
    CloseableHttpClient client = null;
    private static RequestConfig requestConfig = null;
    InputStream path =  null;
    DatabaseReader reader = null;
    @Override
    public void open(FunctionContext context) throws Exception {

        super.open(context);
        requestConfig = RequestConfig.custom()
                .setConnectTimeout(50000) //一、连接超时:connectionTimeout-->指的是连接一个url的连接等待时间
                .setSocketTimeout(5000)  // 二、读取数据超时:SocketTimeout-->指的是连接上一个url,获取response的返回等待时间
                .setConnectionRequestTimeout(5000)
                .setMaxRedirects(0)
                .build();

        client = getConnection();
        //client.getParams().setParameter(HttpMethodParams.HTTP_CONTENT_CHARSET, "UTF-8");

        path=GetResolveIp4Ip6AP.class.getResourceAsStream("/GeoLite2-Country.mmdb");
        reader = new DatabaseReader.Builder(path).withCache(new CHMCache()).build();

    }

    public void eval (String ip) throws Exception{
        String countryCode = "";
        String countryName =""; //todo 新加
        String city = "";
        String stateprov = "";

        //todo
        Row row = new Row(3);

        String res="";
        if(null != ip  && !ip.isEmpty() && ip.split("\\.").length==4 ){ //todo IP4解析
            res = doGet(ip,client);

        }else if(null != ip  && !ip.isEmpty() && !ip.equals("127.0.0.1")){//todo IP6解析

            try {
                InetAddress ipAddress = InetAddress.getByName(ip);
                //-com.maxmind.geoip2.record.Country country=null;

                CountryResponse response = reader.country(ipAddress);
                com.maxmind.geoip2.record.Country country = response.getCountry();
                countryCode= country.getIsoCode();

            }catch (Exception e){
                System.out.println("IP:"+ip);
                e.printStackTrace();
            }

            String deal_countryCode;
            if(countryCode==null|| countryCode.isEmpty()){
                deal_countryCode="UNKNOWN";
            }else{
                deal_countryCode=countryCode;
            }
            row.setField(0,deal_countryCode);
            //row.setField(1,countryName);
            row.setField(1,"未知");
            row.setField(2,"未知");


            collect(row);
            return;
        }

        if(res ==""){
            row.setField(0,"UNKNOWN");
            //row.setField(1,"未知");//todo 新加
            row.setField(1,"未知");
            row.setField(2,"未知");
            collect(row);
            return;
        }

        try{
            JSONObject json = JSON.parseObject(res);
            countryCode = json.getString("country_code");
            countryName = "";//todo 新加
            stateprov = json.getString("region_name");
            city = json.getString("city");
        }catch (Exception e){
            e.printStackTrace();
        }


        if(countryCode==null || countryCode.isEmpty()){
            countryCode="UNKNOWN";
        }
        if(stateprov==null || stateprov.isEmpty()){
            stateprov="未知";
        }
        if(city==null || city.isEmpty()){
            city="未知";
        }
        row.setField(0,countryCode);
        //row.setField(1,countryName);//todo 新加
        row.setField(1,stateprov);
        row.setField(2,city);

        collect(row);



    }
    @Override
    public void close() throws Exception {
        if(null != client){
            client.close();
            reader.close();
            path.close();
        }
        super.close();
    }

    //todo flink 注掉
//    @Override
//    // 如果返回值是Row,则必须重载实现getResultType方法,显式地声明返回的字段类型。
//    public DataType getResultType(Object[] arguments, Class[] argTypes) {
//        return DataTypes.createRowType(DataTypes.STRING, DataTypes.STRING, DataTypes.STRING);
//    }

    private static CloseableHttpClient getConnection() {
        HttpHost target = new HttpHost("0.0.0.0", 80);



        PoolingHttpClientConnectionManager connectionManager = new PoolingHttpClientConnectionManager();
        connectionManager.setMaxTotal(2000);//客户端总并行链接最大数
        connectionManager.setDefaultMaxPerRoute(2000);//每个主机的最大并行链接数
        connectionManager.setMaxPerRoute(new HttpRoute(target), 2000);

        HttpClientBuilder httpBuilder = HttpClients.custom();
        httpBuilder.setConnectionManager(connectionManager);

        CloseableHttpClient httpClient = httpBuilder.build();
        return httpClient;
    }

    private static String doGet(String ip, CloseableHttpClient client) {
        //简单的对ip地址的合法性做一下验证
        if(null == ip  || ip.isEmpty() || ip.split("\\.").length!=4 ){
            return "";
        }

        if (null == client) {
            client =  getConnection();
        }
        HttpGet getMethod = new HttpGet("http://0.0.0.0:80/json/" + ip);
        getMethod.setConfig(requestConfig);
        String res = "";
        try {
            CloseableHttpResponse response = client.execute(getMethod);


            if (response.getStatusLine().getStatusCode() == 200) {
                res =  EntityUtils.toString(response.getEntity());
//                System.out.println(res);
            }
        } catch (IOException e) {
            e.printStackTrace();
        } finally {
            getMethod.releaseConnection();
        }
        return res;
    }

}
相关推荐
得物技术7 小时前
从埋点需求到规则资产:Hermes Agent 重构得物数仓工作流
大数据·llm·ai编程
久美子8 小时前
AI驱动数仓建设的Harness工程实践——本体建模、知识分层与上下文工程
大数据
大树881 天前
金刚石散热越强,管路越先见顶
大数据·运维·服务器·人工智能·ai
大志哥1231 天前
ES和Logstash日志链路系统上线后遭遇切片爆炸(解决)
大数据·elasticsearch
果丁智能1 天前
物联网智能锁赋能集中式住宿:身份核验与远程权限管控的全链路技术实践
大数据·人工智能·物联网·智能家居
ApacheSeaTunnel1 天前
实战演示 | 基于 Apache SeaTunnel 与 Apache DolphinScheduler 实现 MySQL 到 Doris 离线定时增量同步
大数据·mysql·开源·doris·数据集成·seatunnel·数据同步
weixin_397574091 天前
PDF复杂表格的1:1还原引擎:跨页表格自动拼接技术实战
大数据·人工智能·pdf
极光代码工作室1 天前
基于数据仓库的电商数据分析平台
大数据·hadoop·python·spark·数据可视化
秋名山码民1 天前
Graph RAG 深度解析:从向量检索到知识推理的技术演进
大数据·人工智能·rag
m0_380167141 天前
面向开发者的Top10加密货币数据API(2026年最新)
大数据·人工智能·区块链