flink读取csv文件

    1. 所需依赖
    <dependency>
      <groupId>org.apache.flink</groupId>
      <artifactId>flink-table</artifactId>
      <version>1.9.0</version>
    </dependency>
    <!-- https://mvnrepository.com/artifact/org.apache.flink/flink-table-api-java-bridge -->
    <dependency>
      <groupId>org.apache.flink</groupId>
      <artifactId>flink-table-api-java-bridge_2.11</artifactId>
      <version>1.9.0</version>
    </dependency>
    <dependency>
      <groupId>org.apache.flink</groupId>
      <artifactId>flink-table-planner_2.11</artifactId>
      <version>1.9.0</version>
      <scope>provided</scope>
    </dependency>
    2. 使用 Flink 读取 CSV 文件,通过 Table API 创建逻辑表,并使用 SQL 进行查询
/**
 * 读取csv文件  并使用table api创建逻辑表  进行查询
 */
public class CsvSource {
    public static void main(String[] args) throws Exception {
        ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment();
        DataSet<Student> csvInput = env.readCsvFile("C:\\Users\\Lenovo\\Desktop\\test.csv")
                //设置要读取的属性列   1为读   0为不读
                .includeFields("10010")
                //忽略第一行  (忽略表头)
                .ignoreFirstLine()
                //指定对应的实体类型                 //指定对应的属性名
                .pojoType(Student.class,"name","score");
        //使用table api创建逻辑表
        BatchTableEnvironment tableEnv = BatchTableEnvironment.create(env);
        Table table = tableEnv.fromDataSet(csvInput);
        tableEnv.registerTable("test_flink",table);
        //执行sql查询
        Table result = tableEnv.sqlQuery("select * from test_flink where name = 'suns1'");
        //输出结果
        DataSet<Student> doubleDataSet = tableEnv.toDataSet(result, Student.class);
        doubleDataSet.print();
    }

你可能感兴趣的:(flink学习)