今天写了一个稍微复杂的例子,实现了类似 MySQL group_concat 的功能,记录一下。
MapToString 的实现请参考 bug 那篇博客。
public static void main(String[] arg) throws Exception { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); BatchTableEnvironment tableEnv = new BatchTableEnvironment(env,TableConfig.DEFAULT()); tableEnv.registerFunction("mapToString",new MapToString()); getProjectInfo(env,tableEnv); getProject(env,tableEnv); joinTableProjectWithInfo(tableEnv); Table query = tableEnv.sqlQuery("select id,name,type from result_agg"); DataSet<Row> ds= tableEnv.toDataSet(query,Row.class); ds.print(); ds.writeAsText("/home/test",WriteMode.OVERWRITE); env.execute("multiple-table"); } public static void getProjectInfo(ExecutionEnvironment env,BatchTableEnvironment tableEnv) { Type@R_922_4045@ion[] fieldTypes = new Type@R_922_4045@ion[] { BasicTypeInfo.STRING_TYPE_INFO,BasicTypeInfo.STRING_TYPE_INFO }; String[] fieldNames = new String[] { "id","type" }; RowTypeInfo rowTypeInfo = new RowTypeInfo(fieldTypes,fieldNames); JDBCInputFormat jdbcInputFormat = JDBCInputFormat.buildJDBCInputFormat().setDrivername("com.MysqL.jdbc.Driver") .setDBUrl("jdbc:MysqL://ip:3306/space?characterEncoding=utf8") .setUsername("user").setPassword("pwd") .setQuery("select project_fid,cast(project_info_type as CHAR) as type from project").setRowTypeInfo(rowTypeInfo).finish(); DataSource<Row> s = env.createInput(jdbcInputFormat); tableEnv.registerDataSet("project_info",s); aggProjectInfo(tableEnv,"project_info"); } public static void aggProjectInfo(BatchTableEnvironment tableEnv,String tableName) { Table tapiResult = tableEnv.scan(tableName); tapiResult.printSchema(); Table query = tableEnv.sqlQuery("select id,mapToString(collect(type)) as type from project_info group by id"); tableEnv.registerTable(tableName+"_agg",query); tapiResult = tableEnv.scan(tableName+"_agg"); tapiResult.printSchema(); } public static void getProject(ExecutionEnvironment env,BasicTypeInfo.STRING_TYPE_INFO }; String[] fieldNames = new String[] { "pid","name" }; RowTypeInfo rowTypeInfo = new 
RowTypeInfo(fieldTypes,fieldNames); JDBCInputFormat jdbcInputFormat = JDBCInputFormat.buildJDBCInputFormat().setDrivername("com.MysqL.jdbc.Driver") .setDBUrl("jdbc:MysqL://ip:3306/space?characterEncoding=utf8") .setUsername("user").setPassword("pwd") .setQuery("select fid,project_name from t_project").setRowTypeInfo(rowTypeInfo).finish(); DataSource<Row> s = env.createInput(jdbcInputFormat); tableEnv.registerDataSet("project",s); } public static void joinTableProjectWithInfo(BatchTableEnvironment tableEnv) { Table result =tableEnv.sqlQuery("select a.pid as id,a.name,b.type from project a inner join project_info_agg b on a.pid=b.id"); tableEnv.registerTable("result_agg",result); result.printSchema(); }
版权声明:本文内容由互联网用户自发贡献,该文观点与技术仅代表作者本人。本站仅提供信息存储空间服务,不拥有所有权,不承担相关法律责任。如发现本站有涉嫌侵权/违法违规的内容, 请发送邮件至 [email protected] 举报,一经查实,本站将立刻删除。