|
70 | 70 | "source": [
|
71 | 71 | "## Overview\n",
|
72 | 72 | "\n",
|
73 |
| - "This tutorial focuses on streaming data from a [Kafka](https://docs.confluent.io/current/getting-started.html) cluster into a `tf.data.Dataset` which is then used in conjunction with `tf.keras` for training and inference.\n", |
| 73 | + "This tutorial focuses on streaming data from a [Kafka](https://kafka.apache.org/quickstart) cluster into a `tf.data.Dataset`, which is then used in conjunction with `tf.keras` for training and inference.\n", |
74 | 74 | "\n",
|
75 | 75 | "Kafka is primarily a distributed event-streaming platform that provides scalable, fault-tolerant data streaming across data pipelines. It is an essential technical component at many major enterprises where mission-critical data delivery is a primary requirement.\n",
|
76 | 76 | "\n",
|
77 |
| - "**NOTE:** A basic understanding of the [kafka components](https://docs.confluent.io/current/kafka/introduction.html) will help you in following the tutorial with ease." |
| 77 | + "**NOTE:** A basic understanding of the [Kafka components](https://kafka.apache.org/documentation/#intro_concepts_and_terms) will help you follow the tutorial with ease.\n", |
| 78 | + "\n", |
| 79 | + "**NOTE:** A Java runtime environment is required to run this tutorial." |
78 | 80 | ]
|
79 | 81 | },
|
80 | 82 | {
|
|
180 | 182 | },
|
181 | 183 | "outputs": [],
|
182 | 184 | "source": [
|
183 |
| - "!curl -sSOL http://packages.confluent.io/archive/5.4/confluent-community-5.4.1-2.12.tar.gz\n", |
184 |
| - "!tar -xzf confluent-community-5.4.1-2.12.tar.gz" |
| 185 | + "!curl -sSOL https://downloads.apache.org/kafka/2.7.0/kafka_2.13-2.7.0.tgz\n", |
| 186 | + "!tar -xzf kafka_2.13-2.7.0.tgz" |
185 | 187 | ]
|
186 | 188 | },
|
187 | 189 | {
|
|
190 | 192 | "id": "vAzfu_WiEs4F"
|
191 | 193 | },
|
192 | 194 | "source": [
|
193 |
| - "Using the default configurations (provided by the confluent package) for spinning up the instances." |
| 195 | + "Use the default configurations (provided by Apache Kafka) to spin up the instances." |
194 | 196 | ]
|
195 | 197 | },
|
196 | 198 | {
|
|
201 | 203 | },
|
202 | 204 | "outputs": [],
|
203 | 205 | "source": [
|
204 |
| - "!cd confluent-5.4.1 && bin/zookeeper-server-start -daemon etc/kafka/zookeeper.properties\n", |
205 |
| - "!cd confluent-5.4.1 && bin/kafka-server-start -daemon etc/kafka/server.properties\n", |
| 206 | + "!./kafka_2.13-2.7.0/bin/zookeeper-server-start.sh -daemon ./kafka_2.13-2.7.0/config/zookeeper.properties\n", |
| 207 | + "!./kafka_2.13-2.7.0/bin/kafka-server-start.sh -daemon ./kafka_2.13-2.7.0/config/server.properties\n", |
206 | 208 | "!echo \"Waiting for 10 secs until kafka and zookeeper services are up and running\"\n",
|
207 | 209 | "!sleep 10\n"
|
208 | 210 | ]
|
|
247 | 249 | },
|
248 | 250 | "outputs": [],
|
249 | 251 | "source": [
|
250 |
| - "!confluent-5.4.1/bin/kafka-topics --create --zookeeper 127.0.0.1:2181 --replication-factor 1 --partitions 1 --topic susy-train\n", |
251 |
| - "!confluent-5.4.1/bin/kafka-topics --create --zookeeper 127.0.0.1:2181 --replication-factor 1 --partitions 2 --topic susy-test\n" |
| 252 | + "!./kafka_2.13-2.7.0/bin/kafka-topics.sh --create --bootstrap-server 127.0.0.1:9092 --replication-factor 1 --partitions 1 --topic susy-train\n", |
| 253 | + "!./kafka_2.13-2.7.0/bin/kafka-topics.sh --create --bootstrap-server 127.0.0.1:9092 --replication-factor 1 --partitions 2 --topic susy-test\n" |
252 | 254 | ]
|
253 | 255 | },
|
254 | 256 | {
|
|
268 | 270 | },
|
269 | 271 | "outputs": [],
|
270 | 272 | "source": [
|
271 |
| - "!confluent-5.4.1/bin/kafka-topics --bootstrap-server 127.0.0.1:9092 --describe --topic susy-train\n", |
272 |
| - "!confluent-5.4.1/bin/kafka-topics --bootstrap-server 127.0.0.1:9092 --describe --topic susy-test\n" |
| 273 | + "!./kafka_2.13-2.7.0/bin/kafka-topics.sh --describe --bootstrap-server 127.0.0.1:9092 --topic susy-train\n", |
| 274 | + "!./kafka_2.13-2.7.0/bin/kafka-topics.sh --describe --bootstrap-server 127.0.0.1:9092 --topic susy-test\n" |
273 | 275 | ]
|
274 | 276 | },
|
275 | 277 | {
|
|
720 | 722 | },
|
721 | 723 | "outputs": [],
|
722 | 724 | "source": [
|
723 |
| - "!confluent-5.4.1/bin/kafka-consumer-groups --bootstrap-server 127.0.0.1:9092 --describe --group testcg\n" |
| 725 | + "!./kafka_2.13-2.7.0/bin/kafka-consumer-groups.sh --bootstrap-server 127.0.0.1:9092 --describe --group testcg\n" |
724 | 726 | ]
|
725 | 727 | },
|
726 | 728 | {
|
|
0 commit comments