Java读文件写入kafka

Java读文件写入kafka

Java读文件写入kafka

文件格式

840271		103208		0	0.0	insert	84e66588-8875-4411-9cc6-0ac8302408bf	3	2	4	wangxiao	0.0	0	0.0	9927525	1619330049000	normal	1bd221d7380546be9fe8e10a63cf8130	0	0	NULL	0	0	Qw==	4253976	79

840271		103208		0	0.0	insert	cece91f8-8a17-4417-84d8-f6293849e187	3	2	4	wangxiao	0.0	0	0.0	9927525	1619330049000	normal	38204d736e8646fd956131409fc4196e	0	0	NULL	0	0	Qw==	4002760	80

pom依赖

 <dependencies>

    <dependency>

      <groupId>org.apache.kafka</groupId>

      <artifactId>kafka-clients</artifactId>

      <version>0.11.0.0</version>

      <scope>provided</scope>

    </dependency>

</dependencies>

<build>

        <!--编译的文件目录-->

        <sourceDirectory>src/main/scala</sourceDirectory>

        <resources>

            <resource>

                <directory>src/main/resources</directory>

            </resource>

        </resources>

        <plugins>

            <!-- build-helper-maven-plugin, 设置多个源文件夹 -->

            <plugin>

                <groupId>org.codehaus.mojo</groupId>

                <artifactId>build-helper-maven-plugin</artifactId>

                <version>3.0.0</version>

                <executions>

                    <execution>

                        <id>add-source</id>

                        <phase>generate-sources</phase>

                        <goals>

                            <goal>add-source</goal>

                        </goals>

                        <configuration>

                            <sources>

                                <source>src/main/java</source>

                                <source>src/main/scala</source>

                                <!-- 我们可以通过在这里添加多个source节点，来添加任意多个源文件夹 -->

                            </sources>

                        </configuration>

                    </execution>

                </executions>

            </plugin>

            <plugin>

                <artifactId>maven-assembly-plugin</artifactId>

                <configuration>

                    <descriptorRefs>

                        <descriptorRef>jar-with-dependencies</descriptorRef>

                    </descriptorRefs>

                    <archive>

                        <manifest>

                            <mainClass>com.xueersi.bdc.flink.WordCount</mainClass>

                        </manifest>

                    </archive>

                </configuration>

                <executions>

                    <execution>

                        <id>make-assembly</id>

                        <phase>package</phase>

                        <goals>

                            <goal>single</goal>

                        </goals>

                    </execution>

                </executions>

            </plugin>

            <!-- Java Compiler -->

            <plugin>

                <groupId>org.apache.maven.plugins</groupId>

                <artifactId>maven-compiler-plugin</artifactId>

                <version>3.1</version>

                <configuration>

                    <source>1.8</source>

                    <target>1.8</target>

                </configuration>

            </plugin>

            <!--Scala Compiler-->

            <plugin>

                <groupId>net.alchim31.maven</groupId>

                <artifactId>scala-maven-plugin</artifactId>

                <version>3.2.2</version>

                <executions>

                    <execution>

                        <goals>

                            <goal>compile</goal>

                            <goal>testCompile</goal>

                        </goals>

                    </execution>

                </executions>

            </plugin>

        </plugins>

    </build>

java代码

import com.alibaba.fastjson.JSON;

import com.bdc.flink.slove_problem.Ans5;

import org.apache.kafka.clients.producer.KafkaProducer;

import org.apache.kafka.clients.producer.Producer;

import org.apache.kafka.clients.producer.ProducerRecord;

import java.io.*;

import java.text.SimpleDateFormat;

import java.util.Date;

import java.util.Properties;

/**

 * @description: 读取D2数据（场景5）写入kafka

 * @author: HaoWu

 * @create: 2021年04月26日

 */

public class D2ToKafka {

    public static void main(String[] args) throws IOException, InterruptedException {

//        String bootstrap_servers = "10.90.XXXX:9092,10.90.XXXX:9092,10.90.XXXX:9092"; // 输出kafak路径

//        String topic = "test20585696test"; //输出topic

//        String path = "/Users/haowu/software/d2_test";

        String bootstrap_servers= args[0]; // 输出kafak路径

        String topic=args[1]; //输出topic

        String path = args[2]; //输入文件路径

        Properties props = new Properties();

        props.put("bootstrap.servers", bootstrap_servers);//maxwell 测试kafka集群

        props.put("acks", "all");

        props.put("retries", 1);//重试次数

        props.put("batch.size", 16384);//批次大小

        props.put("linger.ms", 1);//等待时间

        props.put("buffer.memory", 33554432);//RecordAccumulator缓冲区大小

        props.put("key.serializer", "org.apache.kafka.common.serialization.StringSerializer");

        props.put("value.serializer", "org.apache.kafka.common.serialization.StringSerializer");

        Producer<String, String> producer = new KafkaProducer<>(props);

        readTxt2Json(path, producer, topic);

    }

    public static void readTxt2Json(String path, Producer producer, String topic) throws IOException, InterruptedException {

        File file = new File(path);

        FileInputStream fis = null;

        InputStreamReader isr = null;

        BufferedReader br = null;

        try {

            fis = new FileInputStream(file);

        } catch (FileNotFoundException e) {

            e.printStackTrace();

        }

        try {

            isr = new InputStreamReader(fis, "utf-8");

        } catch (UnsupportedEncodingException e) {

            e.printStackTrace();

        }

        br = new BufferedReader(isr);

        String line = null;

        System.out.println("================== start ===================：" + System.currentTimeMillis());

        while ((line = br.readLine()) != null) {

            Ans5 ans5 = str2JsonStr(line);

            String key = ans5.getStu_id();

            String value = JSON.toJSONString(ans5);

            System.out.println(value);

            // 写入kafka

            producer.send(new ProducerRecord<>(topic, key, value));

        }

        //System.out.println(jsonStr);

        //关闭produce

        producer.close();

        System.out.println("================== end ===================：" + System.currentTimeMillis());

    }

    /**

     * 构建场景5作答bean，字符串转json字符

     *

     * @param str

     * @return

     */

    public static Ans5 str2JsonStr(String str) {

        String[] datas = str.split("\t");

        D2D3Bean bean = new D2D3Bean(datas[0], datas[1], datas[2], datas[3], datas[4], datas[5]

                , datas[6], datas[7], datas[8], datas[9], datas[10]

                , datas[11], datas[12], datas[13], datas[14], datas[15]

                , datas[16], datas[17], datas[18], datas[19], datas[20], datas[21], datas[22]

                , datas[23], datas[24], datas[25], datas[26]);

        return new Ans5(bean.getStu_id(), bean.getCourse_id(), bean.getPlan_id(), bean.getQues_id(), bean.getUser_answer(), bean.getAnswer_duration(),

               fromTimestampToHour(bean.getSub_time()), bean.getAnswer_status(), bean.getUuid(), bean.getOperate_type(), bean.getAns_scene(), bean.getRecom_id(), bean.getGrade_id(),

                bean.getSubject_id(), bean.getOrg_code(), bean.getQue_score(), bean.getStu_score(), bean.getScene_code(), bean.getQue_sort(), bean.getTest_category(), bean.getExam_id(), bean.getTest_num()

        );

    }

    /**

     * 毫秒时间戳->yyyy-MM-dd HH:mm:ss

     * @param ts

     * @return

     */

    public static String fromTimestampToHour(String ts){

        SimpleDateFormat simpleDateFormat = new SimpleDateFormat("yyyy-MM-dd HH:mm:ss");

        Date date = new Date(Long.valueOf(ts));

        return  simpleDateFormat.format(date);

    }

}

Java读文件写入kafka的更多相关文章

hdfs文件写入kafka集群
1. 场景描述因新增Kafka集群,需要将hdfs文件写入到新增的Kafka集群中,后来发现文件不多,就直接下载文件到本地,通过Main函数写入了,假如需要部署到服务器上执行,需将文件读取这块稍做修 ...
java 读文件解析
[Java]读取文件方法大全 1.按字节读取文件内容2.按字符读取文件内容3.按行读取文件内容 4.随机读取文件内容 public class ReadFromFile { /** ...
Java读文件
public class ReadFromFile { /** * 以字节为单位读取文件,常用于读二进制文件,如图片.声音.影像等文件. */ public static void readFileB ...
Java读文件夹
使用JAVA读取文件夹中的多个文件 package hx.ReadFile; import java.io.FileNotFoundException; import java.io.IOExcept ...
java读文件的几个类
链接地址:http://blog.sina.com.cn/s/blog_407a68fc0100f628.html 最初Java是不支持对文本文件的处理的,为了弥补这个缺憾而引入了Reader和Wri ...
java 读文件路径问题
文件路径:右键点击src新建Source Folder,创建结果与src目录同级. C:\Users\lenovo\workspace\timedTask\config\userinfo.proper ...
java创建文件写入内容，并实现下载该文件
public void getText(){ response.setHeader("Content-Disposition", "attachment;filename ...
JAVA读文件和写文件的的代码模版
有的时候经常为真么读写文件最合理发愁,因为JAVA提过读写文件的方式太多了(C更甚至,fopen & open又有多少人傻傻分不去,更别说ReadFile了). 这里个人绝对比较好的写法,仅供 ...
spark读文件写入mysql(scala版本)
package com.zjlantone.hive import java.util.Properties import com.zjlantone.hive.SparkOperaterHive.s ...

随机推荐

把数组排成最小的数牛客网剑指Offer
把数组排成最小的数牛客网剑指Offer 题目描述输入一个正整数数组,把数组里所有数字拼接起来排成一个数,打印能拼接出的所有数字中最小的一个.例如输入数组{3,32,321},则打印出这三个数字能 ...
hdu 5185 Equation（分析+DP）
题意: Gorwin is very interested in equations. Nowadays she gets an equation like thisx1+x2+x3+⋯+xn=n, ...
利用Wireshark 解密HTTPS流量
在我之前的一篇文章中已经介绍了一种解密HTTPS流量的一种方法,大致方法就是客户端手动信任中间人,然后中间人重新封包SSL流量. 文章地址: http://professor.blog.51cto.c ...
关于Arrays类的静态方法asList()
Array.asList():是数组转成集合的方法 List<String> list = Arrays.asList(new String[]{"AA", " ...
topk算法
方法一堆排序自建堆 heapMax方法,从上至下调整堆 pop时,可以使用自上而下调整堆,调用heapMax(arr,0,sz-1); push时,需要自下到上调整即从上到下调整: void h ...
该虚拟机似乎正在使用中。如果该虚拟机未在使用，请按“获取所有权(T)”按钮获取它的所有权
问题打开虚拟机镜像时报 VMware该虚拟机似乎正在使用中.如果该虚拟机未在使用,请按"获取所有权(T)"按钮获取它的所有权解决方法在你安装的镜像文件目录下找到后缀为.vmx ...
vuex配置token和用户信息
首先设计的是登录成功后端产生token,前端取出放在Local Storage,便于后面每个请求默认带上这里的token以及取用户相关信息和main.js同级建store.js文件,代码如下 imp ...
celery config
/* Useful celery config. app = Celery('tasks', broker='redis://localhost:6379', backend='redis://loc ...
Qt Creator 源码学习笔记02，认识框架结构
阅读本文大概需要 6 分钟在上一篇大概了解了关于Qt Creator 基础知识后[1],本篇先学习下框架基本结构,这样能够清晰的知道这个框架当中包含哪些文件.文件夹.工程文件,这些文件分别代表什么意 ...
VC练习一
1 #include<windows.h> 2 #include<stdio.h> 3 LRESULT CALLBACK WinSunProc(HWND hwnd,UINT u ...

Java读文件写入kafka

Java读文件写入kafka

文件格式

pom依赖

java代码

Java读文件写入kafka的更多相关文章

随机推荐

热门专题