【发布时间】:2020-09-04 14:42:18
【问题描述】:
我有以下 Kafka 连接器配置:
{
  "name": "some-topic-connector",
  "config": {
    "connector.class": "io.confluent.connect.hdfs.HdfsSinkConnector",
    "tasks.max": "1",
    "topics": "some-topic",
    "hdfs.url": "hdfs://hadoopams1",
    "logs.dir": "apps/kafka-connect-preview/some-topic.logs",
    "topics.dir": "apps/kafka-connect-preview/some-topic.db",
    "hadoop.conf.dir": "/etc/hadoop/conf",
    "flush.size": "1000000",
    "rotate.interval.ms": "3600000",
    "rotate.schedule.interval.ms": "86400000",
    "hive.integration": "true",
    "hive.metastore.uris": "thrift://metastore-1.hadoop-1.foobar.com:9083",
    "hive.database": "preview",
    "locale": "en_GB",
    "timezone": "Europe/Berlin",
    "key.converter": "org.apache.kafka.connect.storage.StringConverter",
    "value.converter": "io.confluent.connect.avro.AvroConverter",
    "value.converter.schema.registry.url": "http://schema-registry.preview.foobar.com",
    "schema.compatibility": "BACKWARD",
    "partitioner.class": "io.confluent.connect.storage.partitioner.TimeBasedPartitioner",
    "partition.duration.ms": "86400000",
    "path.format": "'dt'=YYYYMMdd",
    "partition.field.name": "dt"
  }
}
我已确认数据已成功写入 HDFS,但不知为何 Hive 中的表并未被创建。在 Kafka Connect 的日志中,我也没有看到任何错误。
我做错了什么?是否遗漏了某些配置或前提条件?
【问题讨论】:
标签: apache-kafka hive apache-kafka-connect