kafka-compression.td 5.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171
  1. # Copyright Materialize, Inc. and contributors. All rights reserved.
  2. #
  3. # Use of this software is governed by the Business Source License
  4. # included in the LICENSE file at the root of this repository.
  5. #
  6. # As of the Change Date specified in that file, in accordance with
  7. # the Business Source License, use of this software will be governed
  8. # by the Apache License, Version 2.0.
  # Argument defaults: `default-storage-size` is the SIZE given to every
  # cluster created in this file, and `single-replica-cluster` is the cluster
  # named by the sink statement that is expected to fail.
  9. $ set-arg-default default-storage-size=1
  10. $ set-arg-default single-replica-cluster=quickstart
  11. # Test support for compressed Kafka topics.
  # Every source and sink in this file gets its own dedicated cluster (11 in
  # total), so the system-wide cluster limit is raised first over the
  # mz_system connection.
  12. $ postgres-execute connection=postgres://mz_system:materialize@${testdrive.materialize-internal-sql-addr}
  13. ALTER SYSTEM SET max_clusters = 20
  # gzip: create a topic with compression=gzip, write two text records to it,
  # and check that a source reading the topic returns both records.
  14. $ kafka-create-topic topic=gzip compression=gzip
  15. $ kafka-ingest format=bytes topic=gzip timestamp=1
  16. hello
  17. world
  # This connection is reused by every source and sink in the file.
  18. > CREATE CONNECTION kafka_conn
  19. TO KAFKA (BROKER '${testdrive.kafka-addr}', SECURITY PROTOCOL PLAINTEXT);
  20. > CREATE CLUSTER gzip_cluster SIZE '${arg.default-storage-size}';
  21. > CREATE SOURCE gzip
  22. IN CLUSTER gzip_cluster
  23. FROM KAFKA CONNECTION kafka_conn (TOPIC 'testdrive-gzip-${testdrive.seed}')
  24. FORMAT TEXT
  25. > SELECT text FROM gzip
  26. hello
  27. world
  # snappy: same scenario as the gzip case, with a compression=snappy topic
  # read through a dedicated cluster.
  28. $ kafka-create-topic topic=snappy compression=snappy
  29. $ kafka-ingest format=bytes topic=snappy timestamp=1
  30. hello
  31. world
  32. > CREATE CLUSTER snappy_cluster SIZE '${arg.default-storage-size}';
  33. > CREATE SOURCE snappy
  34. IN CLUSTER snappy_cluster
  35. FROM KAFKA CONNECTION kafka_conn (TOPIC 'testdrive-snappy-${testdrive.seed}')
  36. FORMAT TEXT
  37. > SELECT text FROM snappy
  38. hello
  39. world
  # lz4: same scenario as the gzip case, with a compression=lz4 topic read
  # through a dedicated cluster.
  40. $ kafka-create-topic topic=lz4 compression=lz4
  41. $ kafka-ingest format=bytes topic=lz4 timestamp=1
  42. hello
  43. world
  44. > CREATE CLUSTER lz4_cluster SIZE '${arg.default-storage-size}';
  45. > CREATE SOURCE lz4
  46. IN CLUSTER lz4_cluster
  47. FROM KAFKA CONNECTION kafka_conn (TOPIC 'testdrive-lz4-${testdrive.seed}')
  48. FORMAT TEXT
  49. > SELECT text FROM lz4
  50. hello
  51. world
  # zstd: same scenario as the gzip case. The topic is created with a single
  # partition because the second source below passes a one-element
  # START OFFSET list.
  52. $ kafka-create-topic topic=zstd compression=zstd partitions=1
  53. $ kafka-ingest format=bytes topic=zstd timestamp=1
  54. hello
  55. world
  56. > CREATE CLUSTER zstd_cluster SIZE '${arg.default-storage-size}';
  57. > CREATE SOURCE zstd
  58. IN CLUSTER zstd_cluster
  59. FROM KAFKA CONNECTION kafka_conn (TOPIC 'testdrive-zstd-${testdrive.seed}')
  60. FORMAT TEXT
  61. > SELECT text FROM zstd
  62. hello
  63. world
  # Second source over the same zstd topic, starting at offset 1 of its only
  # partition. Only `world` is expected, i.e. the first ingested record
  # (presumably at offset 0) is skipped.
  64. > CREATE CLUSTER zstd_fast_forwarded_cluster SIZE '${arg.default-storage-size}';
  65. > CREATE SOURCE zstd_fast_forwarded
  66. IN CLUSTER zstd_fast_forwarded_cluster
  67. FROM KAFKA CONNECTION kafka_conn (START OFFSET=[1], TOPIC 'testdrive-zstd-${testdrive.seed}')
  68. FORMAT TEXT
  69. > SELECT text FROM zstd_fast_forwarded
  70. world
  71. # Test compression with sinks.
  # `feed` is the two-row table that every sink below exports.
  72. > CREATE TABLE feed (a text)
  73. > INSERT INTO feed VALUES ('hello'), ('world')
  # An unrecognized COMPRESSION TYPE value must be rejected, and the error
  # message must name the offending value.
  74. ! CREATE SINK invalid_sink
  75. IN CLUSTER ${arg.single-replica-cluster}
  76. FROM feed
  77. INTO KAFKA CONNECTION kafka_conn (TOPIC 'sink-compression', COMPRESSION TYPE 'pied-piper')
  78. KEY (a) NOT ENFORCED
  79. FORMAT JSON ENVELOPE UPSERT
  80. contains:invalid COMPRESSION TYPE: pied-piper
  # Implicit case: no COMPRESSION TYPE option is given, so this sink uses
  # whatever compression the system applies by default. The sink name
  # indicates that default is lz4 (NOTE(review): confirm against the
  # CREATE SINK documentation).
  81. > CREATE CLUSTER lz4_sink_implicit_cluster SIZE '${arg.default-storage-size}';
  82. > CREATE SINK lz4_sink_implicit
  83. IN CLUSTER lz4_sink_implicit_cluster
  84. FROM feed
  85. INTO KAFKA CONNECTION kafka_conn (TOPIC 'sink-compression')
  86. KEY (a) NOT ENFORCED
  87. FORMAT JSON ENVELOPE UPSERT
  # Explicit case: compression is turned off by naming 'none' in the
  # connection options.
  88. > CREATE CLUSTER none_sink_explicit_cluster SIZE '${arg.default-storage-size}';
  89. > CREATE SINK none_sink_explicit
  90. IN CLUSTER none_sink_explicit_cluster
  91. FROM feed
  92. INTO KAFKA CONNECTION kafka_conn (TOPIC 'sink-compression', COMPRESSION TYPE 'none')
  93. KEY (a) NOT ENFORCED
  94. FORMAT JSON ENVELOPE UPSERT
  # Sinks with an explicitly named codec. Each one runs in its own cluster
  # and writes to the shared 'sink-compression' topic.
  # NOTE(review): snappy is covered on the source side of this file but has
  # no sink here; confirm whether that omission is intentional.
  95. > CREATE CLUSTER gzip_sink_cluster SIZE '${arg.default-storage-size}';
  96. > CREATE SINK gzip_sink
  97. IN CLUSTER gzip_sink_cluster
  98. FROM feed
  99. INTO KAFKA CONNECTION kafka_conn (TOPIC 'sink-compression', COMPRESSION TYPE 'gzip')
  100. KEY (a) NOT ENFORCED
  101. FORMAT JSON ENVELOPE UPSERT
  # Mixed-case spelling of the codec name: the statement is expected to
  # succeed, so the value must be accepted regardless of letter case.
  102. > CREATE CLUSTER gzip_sink_spongebob_case_cluster SIZE '${arg.default-storage-size}';
  103. > CREATE SINK gzip_sink_spongebob_case
  104. IN CLUSTER gzip_sink_spongebob_case_cluster
  105. FROM feed
  106. INTO KAFKA CONNECTION kafka_conn (TOPIC 'sink-compression', COMPRESSION TYPE 'gZiP')
  107. KEY (a) NOT ENFORCED
  108. FORMAT JSON ENVELOPE UPSERT
  109. > CREATE CLUSTER lz4_sink_cluster SIZE '${arg.default-storage-size}';
  110. > CREATE SINK lz4_sink
  111. IN CLUSTER lz4_sink_cluster
  112. FROM feed
  113. INTO KAFKA CONNECTION kafka_conn (TOPIC 'sink-compression', COMPRESSION TYPE 'lz4')
  114. KEY (a) NOT ENFORCED
  115. FORMAT JSON ENVELOPE UPSERT
  116. > CREATE CLUSTER zstd_sink_cluster SIZE '${arg.default-storage-size}';
  117. > CREATE SINK zstd_sink
  118. IN CLUSTER zstd_sink_cluster
  119. FROM feed
  120. INTO KAFKA CONNECTION kafka_conn (TOPIC 'sink-compression', COMPRESSION TYPE 'zstd')
  121. KEY (a) NOT ENFORCED
  122. FORMAT JSON ENVELOPE UPSERT
  123. # The Kafka APIs do not make it possible to assess whether the compression
  124. # actually took place, so we settle for just validating that the data is
  125. # readable.
  # All six sinks write the same two `feed` rows to the shared
  # 'sink-compression' topic, hence the twelve expected records. The topic is
  # located through one of those sinks (lz4_sink_implicit).
  126. $ kafka-verify-data format=json key=false sink=materialize.public.lz4_sink_implicit
  127. {"a": "hello"}
  128. {"a": "world"}
  129. {"a": "hello"}
  130. {"a": "world"}
  131. {"a": "hello"}
  132. {"a": "world"}
  133. {"a": "hello"}
  134. {"a": "world"}
  135. {"a": "hello"}
  136. {"a": "world"}
  137. {"a": "hello"}
  138. {"a": "world"}