flink UTDF函数

代码示例IP解析demo案例

https://help.aliyun.com/zh/flink/developer-reference/udtfs

java 复制代码
package com.xxx.udx;


import com.alibaba.fastjson.JSON;
import com.alibaba.fastjson.JSONObject;
import com.maxmind.db.CHMCache;
import com.maxmind.geoip2.DatabaseReader;
import com.maxmind.geoip2.exception.GeoIp2Exception;
import com.maxmind.geoip2.model.CountryResponse;
import org.apache.flink.table.functions.FunctionContext;
import org.apache.flink.table.functions.TableFunction;
//import org.apache.flink.table.sources.parquet.update.UpdateVectorizedColumnRowInputParquetFormat;
import org.apache.flink.table.types.DataType;
//import org.apache.flink.table.types.DataTypes;
import org.apache.flink.types.Row;
import org.apache.http.HttpHost;
import org.apache.http.client.config.RequestConfig;
import org.apache.http.client.methods.CloseableHttpResponse;
import org.apache.http.client.methods.HttpGet;
import org.apache.http.conn.routing.HttpRoute;
import org.apache.http.impl.client.CloseableHttpClient;
import org.apache.http.impl.client.HttpClientBuilder;
import org.apache.http.impl.client.HttpClients;
import org.apache.http.impl.conn.PoolingHttpClientConnectionManager;
import org.apache.http.util.EntityUtils;

import java.io.IOException;
import java.io.InputStream;
import java.net.InetAddress;
import java.net.UnknownHostException;

/**
 * 使用节点ip解析服务
 */

public class GetResolveIp4Ip6AP extends TableFunction<Row> {
    CloseableHttpClient client = null;
    private static RequestConfig requestConfig = null;
    InputStream path =  null;
    DatabaseReader reader = null;
    @Override
    public void open(FunctionContext context) throws Exception {

        super.open(context);
        requestConfig = RequestConfig.custom()
                .setConnectTimeout(50000) //一、连接超时:connectionTimeout-->指的是连接一个url的连接等待时间
                .setSocketTimeout(5000)  // 二、读取数据超时:SocketTimeout-->指的是连接上一个url,获取response的返回等待时间
                .setConnectionRequestTimeout(5000)
                .setMaxRedirects(0)
                .build();

        client = getConnection();
        //client.getParams().setParameter(HttpMethodParams.HTTP_CONTENT_CHARSET, "UTF-8");

        path=GetResolveIp4Ip6AP.class.getResourceAsStream("/GeoLite2-Country.mmdb");
        reader = new DatabaseReader.Builder(path).withCache(new CHMCache()).build();

    }

    public void eval (String ip) throws Exception{
        String countryCode = "";
        String countryName =""; //todo 新加
        String city = "";
        String stateprov = "";

        //todo
        Row row = new Row(3);

        String res="";
        if(null != ip  && !ip.isEmpty() && ip.split("\\.").length==4 ){ //todo IP4解析
            res = doGet(ip,client);

        }else if(null != ip  && !ip.isEmpty() && !ip.equals("127.0.0.1")){//todo IP6解析

            try {
                InetAddress ipAddress = InetAddress.getByName(ip);
                //-com.maxmind.geoip2.record.Country country=null;

                CountryResponse response = reader.country(ipAddress);
                com.maxmind.geoip2.record.Country country = response.getCountry();
                countryCode= country.getIsoCode();

            }catch (Exception e){
                System.out.println("IP:"+ip);
                e.printStackTrace();
            }

            String deal_countryCode;
            if(countryCode==null|| countryCode.isEmpty()){
                deal_countryCode="UNKNOWN";
            }else{
                deal_countryCode=countryCode;
            }
            row.setField(0,deal_countryCode);
            //row.setField(1,countryName);
            row.setField(1,"未知");
            row.setField(2,"未知");


            collect(row);
            return;
        }

        if(res ==""){
            row.setField(0,"UNKNOWN");
            //row.setField(1,"未知");//todo 新加
            row.setField(1,"未知");
            row.setField(2,"未知");
            collect(row);
            return;
        }

        try{
            JSONObject json = JSON.parseObject(res);
            countryCode = json.getString("country_code");
            countryName = "";//todo 新加
            stateprov = json.getString("region_name");
            city = json.getString("city");
        }catch (Exception e){
            e.printStackTrace();
        }


        if(countryCode==null || countryCode.isEmpty()){
            countryCode="UNKNOWN";
        }
        if(stateprov==null || stateprov.isEmpty()){
            stateprov="未知";
        }
        if(city==null || city.isEmpty()){
            city="未知";
        }
        row.setField(0,countryCode);
        //row.setField(1,countryName);//todo 新加
        row.setField(1,stateprov);
        row.setField(2,city);

        collect(row);



    }
    @Override
    public void close() throws Exception {
        if(null != client){
            client.close();
            reader.close();
            path.close();
        }
        super.close();
    }

    //todo flink 注掉
//    @Override
//    // 如果返回值是Row,则必须重载实现getResultType方法,显式地声明返回的字段类型。
//    public DataType getResultType(Object[] arguments, Class[] argTypes) {
//        return DataTypes.createRowType(DataTypes.STRING, DataTypes.STRING, DataTypes.STRING);
//    }

    private static CloseableHttpClient getConnection() {
        HttpHost target = new HttpHost("0.0.0.0", 80);



        PoolingHttpClientConnectionManager connectionManager = new PoolingHttpClientConnectionManager();
        connectionManager.setMaxTotal(2000);//客户端总并行链接最大数
        connectionManager.setDefaultMaxPerRoute(2000);//每个主机的最大并行链接数
        connectionManager.setMaxPerRoute(new HttpRoute(target), 2000);

        HttpClientBuilder httpBuilder = HttpClients.custom();
        httpBuilder.setConnectionManager(connectionManager);

        CloseableHttpClient httpClient = httpBuilder.build();
        return httpClient;
    }

    private static String doGet(String ip, CloseableHttpClient client) {
        //简单的对ip地址的合法性做一下验证
        if(null == ip  || ip.isEmpty() || ip.split("\\.").length!=4 ){
            return "";
        }

        if (null == client) {
            client =  getConnection();
        }
        HttpGet getMethod = new HttpGet("http://0.0.0.0:80/json/" + ip);
        getMethod.setConfig(requestConfig);
        String res = "";
        try {
            CloseableHttpResponse response = client.execute(getMethod);


            if (response.getStatusLine().getStatusCode() == 200) {
                res =  EntityUtils.toString(response.getEntity());
//                System.out.println(res);
            }
        } catch (IOException e) {
            e.printStackTrace();
        } finally {
            getMethod.releaseConnection();
        }
        return res;
    }

}
相关推荐
Elastic 中国社区官方博客1 小时前
使用 Observability Migration Platform 将 Datadog 和 Grafana 的仪表板与告警迁移到 Kibana
大数据·elasticsearch·搜索引擎·信息可视化·全文检索·grafana·datalog
jkyy20142 小时前
AI运动数字化:以技术重塑场景,健康有益赋能全域运动健康管理
大数据·人工智能·健康医疗
金融小师妹2 小时前
4月30日多因子共振节点:鲍威尔“收官效应”与权力结构重塑的预期重构
大数据·人工智能·重构·逻辑回归
2601_949925182 小时前
AI Agent如何重构跨境物流的决策?
大数据·人工智能·重构·ai agent·geo优化·物流科技
xiaoduo AI3 小时前
客服机器人问题解决率怎么统计?Agent系统自动判断是否解决,比人工回访准?
大数据·人工智能·机器人
小五兄弟4 小时前
YouTube 肖像检测扩展背后:短剧出海版权保护的技术实现与实战策略
大数据·人工智能
阿瑞说项目管理4 小时前
2026 实战入门指南:企业 Agent 到底能解决哪些工作问题?
大数据·人工智能·agent·智能体·企业级ai
ZOOOOOOU4 小时前
云边端协同架构下,门禁权限引擎的离线决策与策略续存实现
大数据·人工智能·架构
189228048614 小时前
EMMC32G-TA28闪存EMMCH26M78103CCR
大数据·人工智能·缓存
dingzd955 小时前
Facebook强化原创内容分发后跨境品牌如何重做素材策略
大数据·人工智能·新媒体运营·内容营销·跨境