flink UTDF函数

代码示例IP解析demo案例

https://help.aliyun.com/zh/flink/developer-reference/udtfs

java 复制代码
package com.xxx.udx;


import com.alibaba.fastjson.JSON;
import com.alibaba.fastjson.JSONObject;
import com.maxmind.db.CHMCache;
import com.maxmind.geoip2.DatabaseReader;
import com.maxmind.geoip2.exception.GeoIp2Exception;
import com.maxmind.geoip2.model.CountryResponse;
import org.apache.flink.table.functions.FunctionContext;
import org.apache.flink.table.functions.TableFunction;
//import org.apache.flink.table.sources.parquet.update.UpdateVectorizedColumnRowInputParquetFormat;
import org.apache.flink.table.types.DataType;
//import org.apache.flink.table.types.DataTypes;
import org.apache.flink.types.Row;
import org.apache.http.HttpHost;
import org.apache.http.client.config.RequestConfig;
import org.apache.http.client.methods.CloseableHttpResponse;
import org.apache.http.client.methods.HttpGet;
import org.apache.http.conn.routing.HttpRoute;
import org.apache.http.impl.client.CloseableHttpClient;
import org.apache.http.impl.client.HttpClientBuilder;
import org.apache.http.impl.client.HttpClients;
import org.apache.http.impl.conn.PoolingHttpClientConnectionManager;
import org.apache.http.util.EntityUtils;

import java.io.IOException;
import java.io.InputStream;
import java.net.InetAddress;
import java.net.UnknownHostException;

/**
 * 使用节点ip解析服务
 */

public class GetResolveIp4Ip6AP extends TableFunction<Row> {
    CloseableHttpClient client = null;
    private static RequestConfig requestConfig = null;
    InputStream path =  null;
    DatabaseReader reader = null;
    @Override
    public void open(FunctionContext context) throws Exception {

        super.open(context);
        requestConfig = RequestConfig.custom()
                .setConnectTimeout(50000) //一、连接超时:connectionTimeout-->指的是连接一个url的连接等待时间
                .setSocketTimeout(5000)  // 二、读取数据超时:SocketTimeout-->指的是连接上一个url,获取response的返回等待时间
                .setConnectionRequestTimeout(5000)
                .setMaxRedirects(0)
                .build();

        client = getConnection();
        //client.getParams().setParameter(HttpMethodParams.HTTP_CONTENT_CHARSET, "UTF-8");

        path=GetResolveIp4Ip6AP.class.getResourceAsStream("/GeoLite2-Country.mmdb");
        reader = new DatabaseReader.Builder(path).withCache(new CHMCache()).build();

    }

    public void eval (String ip) throws Exception{
        String countryCode = "";
        String countryName =""; //todo 新加
        String city = "";
        String stateprov = "";

        //todo
        Row row = new Row(3);

        String res="";
        if(null != ip  && !ip.isEmpty() && ip.split("\\.").length==4 ){ //todo IP4解析
            res = doGet(ip,client);

        }else if(null != ip  && !ip.isEmpty() && !ip.equals("127.0.0.1")){//todo IP6解析

            try {
                InetAddress ipAddress = InetAddress.getByName(ip);
                //-com.maxmind.geoip2.record.Country country=null;

                CountryResponse response = reader.country(ipAddress);
                com.maxmind.geoip2.record.Country country = response.getCountry();
                countryCode= country.getIsoCode();

            }catch (Exception e){
                System.out.println("IP:"+ip);
                e.printStackTrace();
            }

            String deal_countryCode;
            if(countryCode==null|| countryCode.isEmpty()){
                deal_countryCode="UNKNOWN";
            }else{
                deal_countryCode=countryCode;
            }
            row.setField(0,deal_countryCode);
            //row.setField(1,countryName);
            row.setField(1,"未知");
            row.setField(2,"未知");


            collect(row);
            return;
        }

        if(res ==""){
            row.setField(0,"UNKNOWN");
            //row.setField(1,"未知");//todo 新加
            row.setField(1,"未知");
            row.setField(2,"未知");
            collect(row);
            return;
        }

        try{
            JSONObject json = JSON.parseObject(res);
            countryCode = json.getString("country_code");
            countryName = "";//todo 新加
            stateprov = json.getString("region_name");
            city = json.getString("city");
        }catch (Exception e){
            e.printStackTrace();
        }


        if(countryCode==null || countryCode.isEmpty()){
            countryCode="UNKNOWN";
        }
        if(stateprov==null || stateprov.isEmpty()){
            stateprov="未知";
        }
        if(city==null || city.isEmpty()){
            city="未知";
        }
        row.setField(0,countryCode);
        //row.setField(1,countryName);//todo 新加
        row.setField(1,stateprov);
        row.setField(2,city);

        collect(row);



    }
    @Override
    public void close() throws Exception {
        if(null != client){
            client.close();
            reader.close();
            path.close();
        }
        super.close();
    }

    //todo flink 注掉
//    @Override
//    // 如果返回值是Row,则必须重载实现getResultType方法,显式地声明返回的字段类型。
//    public DataType getResultType(Object[] arguments, Class[] argTypes) {
//        return DataTypes.createRowType(DataTypes.STRING, DataTypes.STRING, DataTypes.STRING);
//    }

    private static CloseableHttpClient getConnection() {
        HttpHost target = new HttpHost("0.0.0.0", 80);



        PoolingHttpClientConnectionManager connectionManager = new PoolingHttpClientConnectionManager();
        connectionManager.setMaxTotal(2000);//客户端总并行链接最大数
        connectionManager.setDefaultMaxPerRoute(2000);//每个主机的最大并行链接数
        connectionManager.setMaxPerRoute(new HttpRoute(target), 2000);

        HttpClientBuilder httpBuilder = HttpClients.custom();
        httpBuilder.setConnectionManager(connectionManager);

        CloseableHttpClient httpClient = httpBuilder.build();
        return httpClient;
    }

    private static String doGet(String ip, CloseableHttpClient client) {
        //简单的对ip地址的合法性做一下验证
        if(null == ip  || ip.isEmpty() || ip.split("\\.").length!=4 ){
            return "";
        }

        if (null == client) {
            client =  getConnection();
        }
        HttpGet getMethod = new HttpGet("http://0.0.0.0:80/json/" + ip);
        getMethod.setConfig(requestConfig);
        String res = "";
        try {
            CloseableHttpResponse response = client.execute(getMethod);


            if (response.getStatusLine().getStatusCode() == 200) {
                res =  EntityUtils.toString(response.getEntity());
//                System.out.println(res);
            }
        } catch (IOException e) {
            e.printStackTrace();
        } finally {
            getMethod.releaseConnection();
        }
        return res;
    }

}
相关推荐
工作中的程序员3 小时前
flink keyby使用与总结 基础片段梳理
大数据·flink
Hy行者勇哥3 小时前
数据中台的数据源与数据处理流程
大数据·前端·人工智能·学习·个人开发
00后程序员张3 小时前
RabbitMQ核心机制
java·大数据·分布式
AutoMQ4 小时前
10.17 上海 Google Meetup:从数据出发,解锁 AI 助力增长的新边界
大数据·人工智能
武子康4 小时前
大数据-119 - Flink Flink 窗口(Window)全解析:Tumbling、Sliding、Session 应用场景 使用详解 最佳实践
大数据·后端·flink
阿水实证通4 小时前
能源经济大赛选题推荐:新能源汽车试点城市政策对能源消耗的负面影响——基于技术替代效应的视角
大数据·人工智能·汽车
nihaoma30205 小时前
[JS]JavaScript的性能优化从内存泄露到垃圾回收的实战解析
flink
TomCode先生5 小时前
SaaS版MES系统PC端后台功能清单与设计说明
大数据