Skip to content

Commit 71dd925

Browse files
committed
lint fixes
1 parent 4db1734 commit 71dd925

File tree

2 files changed

+15
-14
lines changed

2 files changed

+15
-14
lines changed

pyiceberg/table/puffin.py

Lines changed: 8 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,8 @@
1717
import io
1818
import math
1919
import zlib
20-
from typing import TYPE_CHECKING, Dict, Iterable, List, Literal, Optional
20+
from collections.abc import Iterable
21+
from typing import TYPE_CHECKING, Literal
2122

2223
from pydantic import Field
2324
from pyroaring import BitMap, FrozenBitMap
@@ -65,9 +66,9 @@ def _deserialize_bitmap(pl: bytes) -> list[BitMap]:
6566
return bitmaps
6667

6768

68-
def _serialize_bitmaps(bitmaps: Dict[int, BitMap]) -> bytes:
69+
def _serialize_bitmaps(bitmaps: dict[int, BitMap]) -> bytes:
6970
"""
70-
Serializes a dictionary of bitmaps into a byte array.
71+
Serialize a dictionary of bitmaps into a byte array.
7172
7273
The format is:
7374
- 8 bytes: number of bitmaps (little-endian)
@@ -149,8 +150,8 @@ def to_vector(self) -> dict[str, "pa.ChunkedArray"]:
149150

150151

151152
class PuffinWriter:
152-
_blobs: List[PuffinBlobMetadata]
153-
_blob_payloads: List[bytes]
153+
_blobs: list[PuffinBlobMetadata]
154+
_blob_payloads: list[bytes]
154155

155156
def __init__(self) -> None:
156157
self._blobs = []
@@ -162,7 +163,7 @@ def add(
162163
referenced_data_file: str,
163164
) -> None:
164165
# 1. Create bitmaps from positions
165-
bitmaps: Dict[int, BitMap] = {}
166+
bitmaps: dict[int, BitMap] = {}
166167
cardinality = 0
167168
for pos in positions:
168169
cardinality += 1
@@ -219,7 +220,7 @@ def finish(self) -> bytes:
219220
for blob_payload in self._blob_payloads:
220221
payload_buffer.write(blob_payload)
221222

222-
updated_blobs_metadata: List[PuffinBlobMetadata] = []
223+
updated_blobs_metadata: list[PuffinBlobMetadata] = []
223224
current_offset = 4 # Start after file magic (4 bytes)
224225
for i, blob_payload in enumerate(self._blob_payloads):
225226
original_metadata_dict = self._blobs[i].model_dump(by_alias=True, exclude_none=True)

tests/table/test_puffin.py

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,7 @@
1919
import pytest
2020
from pyroaring import BitMap
2121

22-
from pyiceberg.table.puffin import _deserialize_bitmap, PuffinFile, PuffinWriter, PROPERTY_REFERENCED_DATA_FILE
22+
from pyiceberg.table.puffin import PROPERTY_REFERENCED_DATA_FILE, PuffinFile, PuffinWriter, _deserialize_bitmap
2323

2424

2525
def _open_file(file: str) -> bytes:
@@ -73,10 +73,10 @@ def test_map_high_vals() -> None:
7373
_ = _deserialize_bitmap(puffin)
7474

7575

76-
def test_puffin_round_trip():
76+
def test_puffin_round_trip() -> None:
7777
# Define some deletion positions for multiple files
7878
deletions1 = [10, 20, 30]
79-
deletions2 = [5, (1 << 32) + 1] # Test with a high-bit position
79+
deletions2 = [5, (1 << 32) + 1] # Test with a high-bit position
8080

8181
file1_path = "path/to/data1.parquet"
8282
file2_path = "path/to/data2.parquet"
@@ -92,7 +92,7 @@ def test_puffin_round_trip():
9292

9393
# Assert footer metadata
9494
assert len(reader.footer.blobs) == 2
95-
95+
9696
blob1_meta = reader.footer.blobs[0]
9797
assert blob1_meta.properties[PROPERTY_REFERENCED_DATA_FILE] == file1_path
9898
assert blob1_meta.properties["cardinality"] == str(len(deletions1))
@@ -103,15 +103,15 @@ def test_puffin_round_trip():
103103

104104
# Assert the content of deletion vectors
105105
read_vectors = reader.to_vector()
106-
106+
107107
assert file1_path in read_vectors
108108
assert file2_path in read_vectors
109109

110110
assert read_vectors[file1_path].to_pylist() == sorted(deletions1)
111111
assert read_vectors[file2_path].to_pylist() == sorted(deletions2)
112112

113113

114-
def test_write_and_read_puffin_file():
114+
def test_write_and_read_puffin_file() -> None:
115115
writer = PuffinWriter()
116116
writer.add(positions=[1, 2, 3], referenced_data_file="file1.parquet")
117117
writer.add(positions=[4, 5, 6], referenced_data_file="file2.parquet")
@@ -139,7 +139,7 @@ def test_write_and_read_puffin_file():
139139
assert vectors["file2.parquet"].to_pylist() == [4, 5, 6]
140140

141141

142-
def test_puffin_file_with_no_blobs():
142+
def test_puffin_file_with_no_blobs() -> None:
143143
writer = PuffinWriter()
144144
puffin_bytes = writer.finish()
145145

0 commit comments

Comments
 (0)