Study Notes on the imooc Course "Kafka Stream Processing Platform"
Course Introduction
Open-sourced by LinkedIn
Kafka's History
Kafka's Features
What Kafka Is Commonly Used For
What Kafka Is
Producer: produces data
Consumer: consumes data
Consumer Group: a group of consumers
Broker: a server node
Topic: a message topic
Partition: a partition of a topic
Replication: a replica of a partition
Replication Leader: the lead replica of a partition
Replication Manager: manages the replicas
Kafka's Functional Structure
Kafka Data Flow
Kafka Message Structure
Kafka Highlights: Distributed
Kafka Highlights: High Performance
Kafka Highlights: Durability and Scalability
Kafka Use Cases
A Simple Kafka Example
Study Notes
1. Download and install
Zookeeper download: https://zookeeper.apache.org/releases.html#download
Kafka download: http://kafka.apache.org/downloads
Install: unpack the archives and configure the environment variables
2. Start Zookeeper
Unpack: tar -zxf zookeeper-3.4.12.tar.gz
Change directory: cd zookeeper-3.4.12/bin
Start: ./zkServer.sh start /home/zc/server/kafka_2.12-2.0.0/config/zookeeper.properties
3. Start Kafka
Unpack: tar -zxf kafka_2.12-2.0.0.tgz
Change directory: cd kafka_2.12-2.0.0
Start: sudo bin/kafka-server-start.sh config/server.properties
4. Drive a producer and a consumer from the console
Create a topic: sudo ./bin/kafka-topics.sh --create --zookeeper localhost:2181 --replication-factor 1 --partitions 3 --topic myimooc-kafka-topic
List topics: sudo ./bin/kafka-topics.sh --list --zookeeper localhost:2181
Start a producer: sudo ./bin/kafka-console-producer.sh --broker-list localhost:9092 --topic myimooc-kafka-topic
Start a consumer: sudo ./bin/kafka-console-consumer.sh --bootstrap-server localhost:9092 --topic myimooc-kafka-topic --from-beginning
Produce a message: first message
Produce a message: second message
Create a Maven project named 49-kafka-example; its pom is as follows:
<?xml version="1.0" encoding="UTF-8"?>
<project xmlns="http://maven.apache.org/POM/4.0.0"
         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
    <parent>
        <artifactId>49-kafka</artifactId>
        <groupId>com.myimooc</groupId>
        <version>1.0-SNAPSHOT</version>
    </parent>
    <modelVersion>4.0.0</modelVersion>

    <artifactId>49-kafka-example</artifactId>

    <properties>
        <spring.boot.version>2.0.4.RELEASE</spring.boot.version>
    </properties>

    <dependencyManagement>
        <dependencies>
            <dependency>
                <groupId>org.springframework.boot</groupId>
                <artifactId>spring-boot-parent</artifactId>
                <version>${spring.boot.version}</version>
                <type>pom</type>
                <scope>import</scope>
            </dependency>
        </dependencies>
    </dependencyManagement>

    <dependencies>
        <dependency>
            <groupId>org.springframework.boot</groupId>
            <artifactId>spring-boot-starter-web</artifactId>
        </dependency>
        <dependency>
            <groupId>org.springframework.kafka</groupId>
            <artifactId>spring-kafka</artifactId>
        </dependency>
        <dependency>
            <groupId>com.alibaba</groupId>
            <artifactId>fastjson</artifactId>
            <version>1.2.36</version>
        </dependency>
        <dependency>
            <groupId>org.springframework.boot</groupId>
            <artifactId>spring-boot-starter-test</artifactId>
            <scope>test</scope>
        </dependency>
    </dependencies>

    <build>
        <plugins>
            <plugin>
                <groupId>org.springframework.boot</groupId>
                <artifactId>spring-boot-maven-plugin</artifactId>
            </plugin>
        </plugins>
    </build>
</project>
1. Write MessageEntity
package com.myimooc.kafka.example.common;

import java.util.Objects;

/**
 * Title: message entity<br>
 * Description: message entity<br>
 * Date: 2018/09/09
 *
 * @author zc
 */
public class MessageEntity {

    /** Message title. */
    private String title;

    /** Message body. */
    private String body;

    @Override
    public String toString() {
        return "MessageEntity{" +
                "title='" + title + '\'' +
                ", body='" + body + '\'' +
                '}';
    }

    @Override
    public boolean equals(Object o) {
        if (this == o) {
            return true;
        }
        if (o == null || getClass() != o.getClass()) {
            return false;
        }
        MessageEntity that = (MessageEntity) o;
        return Objects.equals(title, that.title) &&
                Objects.equals(body, that.body);
    }

    @Override
    public int hashCode() {
        return Objects.hash(title, body);
    }

    public String getTitle() {
        return title;
    }

    public void setTitle(String title) {
        this.title = title;
    }

    public String getBody() {
        return body;
    }

    public void setBody(String body) {
        this.body = body;
    }
}
2. Write SimpleProducer
package com.myimooc.kafka.example.producer;

import com.alibaba.fastjson.JSON;
import org.apache.kafka.clients.producer.ProducerRecord;
import org.apache.kafka.clients.producer.RecordMetadata;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.kafka.core.KafkaTemplate;
import org.springframework.kafka.support.SendResult;
import org.springframework.stereotype.Component;
import org.springframework.util.concurrent.ListenableFuture;
import org.springframework.util.concurrent.ListenableFutureCallback;

/**
 * Title: producer<br>
 * Description: producer<br>
 * Date: 2018/09/09
 *
 * @author zc
 */
@Component
public class SimpleProducer<T> {

    private Logger logger = LoggerFactory.getLogger(getClass());

    @Autowired
    private KafkaTemplate<String, Object> kafkaTemplate;

    public void send(String topic, String key, T entity) {
        logger.info("Sending message: {}", entity);
        // Serialize the entity to JSON and wrap it in a ProducerRecord
        ProducerRecord<String, Object> record = new ProducerRecord<>(
                topic,
                key,
                JSON.toJSONString(entity)
        );

        long startTime = System.currentTimeMillis();
        ListenableFuture<SendResult<String, Object>> future = this.kafkaTemplate.send(record);
        future.addCallback(new ListenableFutureCallback<SendResult<String, Object>>() {
            @Override
            public void onFailure(Throwable ex) {
                logger.error("Failed to send message", ex);
            }

            @Override
            public void onSuccess(SendResult<String, Object> result) {
                long elapsedTime = System.currentTimeMillis() - startTime;
                RecordMetadata metadata = result.getRecordMetadata();
                // Named "detail" to avoid shadowing the outer ProducerRecord variable
                StringBuilder detail = new StringBuilder(128);
                detail.append("message(")
                        .append("key = ").append(key).append(", ")
                        .append("message = ").append(entity).append(") ")
                        .append("sent to partition(").append(metadata.partition()).append(") ")
                        .append("with offset(").append(metadata.offset()).append(") ")
                        .append("in ").append(elapsedTime).append(" ms");
                logger.info("Message sent successfully: {}", detail);
            }
        });
    }
}
3. Write SimpleConsumer
package com.myimooc.kafka.example.consumer;

import com.alibaba.fastjson.JSONObject;
import com.myimooc.kafka.example.common.MessageEntity;
import org.apache.kafka.clients.consumer.ConsumerRecord;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.kafka.annotation.KafkaListener;
import org.springframework.kafka.support.KafkaHeaders;
import org.springframework.messaging.handler.annotation.Header;
import org.springframework.stereotype.Component;

import java.util.Optional;

/**
 * Title: consumer<br>
 * Description: consumer<br>
 * Date: 2018/09/09
 *
 * @author zc
 */
@Component
public class SimpleConsumer {

    private Logger logger = LoggerFactory.getLogger(getClass());

    @KafkaListener(topics = "${kafka.topic.default}")
    public void listen(ConsumerRecord<?, ?> record, @Header(KafkaHeaders.RECEIVED_TOPIC) String topic) {
        // Guard against a null record value
        Optional<?> kafkaMessage = Optional.ofNullable(record.value());
        if (kafkaMessage.isPresent()) {
            // Deserialize the JSON payload back into a MessageEntity
            Object message = kafkaMessage.get();
            MessageEntity messageEntity = JSONObject.parseObject(message.toString(), MessageEntity.class);
            logger.info("Received topic: {}", topic);
            logger.info("Received record: {}", record);
            logger.info("Received message: {}", messageEntity);
        }
    }
}
4. Write Response
package com.myimooc.kafka.example.common;

import java.io.Serializable;

/**
 * Title: unified response object for REST requests<br>
 * Description: unified response object for REST requests<br>
 * Date: 2018/09/09
 *
 * @author zc
 */
public class Response implements Serializable {

    private static final long serialVersionUID = -972246069648445912L;

    /** Response code. */
    private int code;

    /** Response message. */
    private String message;

    public Response() {
    }

    public Response(int code, String message) {
        this.code = code;
        this.message = message;
    }

    @Override
    public String toString() {
        return "Response{" +
                "code=" + code +
                ", message='" + message + '\'' +
                '}';
    }

    public int getCode() {
        return code;
    }

    public void setCode(int code) {
        this.code = code;
    }

    public String getMessage() {
        return message;
    }

    public void setMessage(String message) {
        this.message = message;
    }
}
5. Write ErrorCode
package com.myimooc.kafka.example.common;

/**
 * Title: error codes<br>
 * Description: error codes<br>
 * Date: 2018/09/09
 *
 * @author zc
 */
public class ErrorCode {

    /** Success. */
    public static final int SUCCESS = 200;

    /** Failure. */
    public static final int EXCEPTION = 500;
}
6. Write ProducerController
package com.myimooc.kafka.example.controller;

import com.alibaba.fastjson.JSON;
import com.myimooc.kafka.example.common.ErrorCode;
import com.myimooc.kafka.example.common.MessageEntity;
import com.myimooc.kafka.example.common.Response;
import com.myimooc.kafka.example.producer.SimpleProducer;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.beans.factory.annotation.Value;
import org.springframework.web.bind.annotation.*;

/**
 * Title: producer controller<br>
 * Description: producer controller<br>
 * Date: 2018/09/09
 *
 * @author zc
 */
@RestController
@RequestMapping("/producer")
public class ProducerController {

    private Logger logger = LoggerFactory.getLogger(getClass());

    @Autowired
    private SimpleProducer<MessageEntity> simpleProducer;

    @Value("${kafka.topic.default}")
    private String topic;

    private static final String KEY = "key";

    @PostMapping("/send")
    public Response sendKafka(@RequestBody MessageEntity message) {
        try {
            logger.info("Message for Kafka: {}", JSON.toJSONString(message));
            this.simpleProducer.send(topic, KEY, message);
            logger.info("Kafka message sent successfully!");
            return new Response(ErrorCode.SUCCESS, "Kafka message sent successfully");
        } catch (Exception ex) {
            logger.error("Failed to send Kafka message:", ex);
            return new Response(ErrorCode.EXCEPTION, "Failed to send Kafka message");
        }
    }
}
7. Write application.properties
##---------- Kafka configuration
## Topic
kafka.topic.default=myimooc-kafka-topic
# Kafka broker address
spring.kafka.bootstrap-servers=192.168.0.105:9092
# Producer configuration
spring.kafka.producer.retries=0
# Number of records to batch per request
spring.kafka.producer.batch-size=4096
# Buffer memory size
spring.kafka.producer.buffer-memory=40960
# Serializers for the message key and value
spring.kafka.producer.key-serializer=org.apache.kafka.common.serialization.StringSerializer
spring.kafka.producer.value-serializer=org.apache.kafka.common.serialization.StringSerializer
# Consumer configuration
spring.kafka.consumer.group-id=myimooc
spring.kafka.consumer.auto-commit-interval=100
spring.kafka.consumer.auto-offset-reset=latest
spring.kafka.consumer.enable-auto-commit=true
# Deserializers for the message key and value
spring.kafka.consumer.key-deserializer=org.apache.kafka.common.serialization.StringDeserializer
spring.kafka.consumer.value-deserializer=org.apache.kafka.common.serialization.StringDeserializer
# Number of threads in the listener container, to increase concurrency
spring.kafka.listener.concurrency=3
8. Write ExampleApplication
package com.myimooc.kafka.example;

import org.springframework.boot.SpringApplication;
import org.springframework.boot.autoconfigure.SpringBootApplication;
import org.springframework.kafka.annotation.EnableKafka;

/**
 * Title: application entry point<br>
 * Description: application entry point<br>
 * Date: 2018/09/09
 *
 * @author zc
 */
@SpringBootApplication
@EnableKafka
public class ExampleApplication {

    public static void main(String[] args) {
        SpringApplication.run(ExampleApplication.class, args);
    }
}
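With Zookeeper, Kafka, and the application running, the endpoint can be exercised from the command line. A quick smoke test (assuming Spring Boot's default port 8080; the field values are arbitrary):

curl -X POST http://localhost:8080/producer/send -H "Content-Type: application/json" -d '{"title":"first","body":"hello kafka"}'

The consumer log should then show the received topic, the raw record, and the deserialized MessageEntity.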
Why Support Transactions
Transaction Definitions for Data Transfer
Transaction Guarantees
Avoiding Zombie Instances
Each transactional Producer is assigned a transactional.id, so that the same Producer instance can be recognized when its process restarts.
Kafka keeps an epoch associated with each transactional.id, stored as internal metadata for that transactional.id.
Once the epoch is bumped, any Producer with the same transactional.id but an older epoch is treated as a zombie, and Kafka rejects subsequent transactional writes from such Producers.
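To make the fencing mechanism concrete, here is a minimal sketch of a transactional producer using the plain Kafka client API, following the pattern from the KafkaProducer javadoc. It is not from the course; the transactional.id value, topic, and broker address are placeholders:

import java.util.Properties;
import org.apache.kafka.clients.producer.KafkaProducer;
import org.apache.kafka.clients.producer.ProducerRecord;
import org.apache.kafka.common.KafkaException;
import org.apache.kafka.common.errors.ProducerFencedException;
import org.apache.kafka.common.serialization.StringSerializer;

public class TransactionalProducerDemo {
    public static void main(String[] args) {
        Properties props = new Properties();
        props.put("bootstrap.servers", "localhost:9092");
        // transactional.id identifies this logical producer across process restarts
        props.put("transactional.id", "myimooc-tx-producer");
        props.put("key.serializer", StringSerializer.class.getName());
        props.put("value.serializer", StringSerializer.class.getName());

        KafkaProducer<String, String> producer = new KafkaProducer<>(props);
        try {
            // Registers the transactional.id with the broker and bumps its epoch,
            // fencing off any older instance that used the same id
            producer.initTransactions();
            producer.beginTransaction();
            producer.send(new ProducerRecord<>("myimooc-kafka-topic", "key", "first message"));
            producer.send(new ProducerRecord<>("myimooc-kafka-topic", "key", "second message"));
            // Both messages become visible to read_committed consumers atomically
            producer.commitTransaction();
        } catch (ProducerFencedException e) {
            // A newer instance with the same transactional.id took over; this
            // producer is a zombie and must not abort, only close
        } catch (KafkaException e) {
            // Any other error: abort so the transaction leaves no visible writes
            producer.abortTransaction();
        } finally {
            producer.close();
        }
    }
}

If a second instance starts with the same transactional.id, its initTransactions() bumps the epoch on the broker, and the first instance's next transactional operation fails with ProducerFencedException, which is exactly the zombie rejection described above.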
Zero-Copy Overview
The common data path for transferring a file to the network
The zero-copy path ("zero" refers to zero copies between kernel space and user space)
Evolution of the common file-to-network data path
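In Java this mechanism is exposed as FileChannel.transferTo, which is what Kafka uses to push log segments to the network. A minimal sketch (the file path, host, and port are placeholders):

import java.io.FileInputStream;
import java.io.IOException;
import java.net.InetSocketAddress;
import java.nio.channels.FileChannel;
import java.nio.channels.SocketChannel;

public class ZeroCopyDemo {
    public static void main(String[] args) throws IOException {
        try (FileChannel file = new FileInputStream("/tmp/demo.log").getChannel();
             SocketChannel socket = SocketChannel.open(new InetSocketAddress("localhost", 9000))) {
            long position = 0;
            long remaining = file.size();
            while (remaining > 0) {
                // transferTo delegates to sendfile(2) on Linux: bytes move from
                // the page cache straight to the socket without ever being
                // copied into a user-space buffer
                long sent = file.transferTo(position, remaining, socket);
                position += sent;
                remaining -= sent;
            }
        }
    }
}

Compare this with the conventional path (read into a user-space buffer, then write to the socket), which costs two extra copies and two extra context switches per chunk.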
Course Summary