blob: cc05ad6ed7dd09ac118c01c18b7fd43e372b596f [file] [log] [blame]
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
from dataclasses import dataclass
from typing import Optional
@dataclass
class DeletionFile:
"""
Deletion file for data file, the first 4 bytes are length, the following is the bitmap content.
- The first 4 bytes are length, should equal to length().
- Next 4 bytes are the magic number, should be equal to 1581511376.
- The remaining content should be a RoaringBitmap.
"""
dv_index_path: str # The file where the vector for data file is located
offset: int # The offset where the vector for data file is located in the dv index file
length: int
cardinality: Optional[int] = None
def __eq__(self, other):
if not isinstance(other, DeletionFile):
return False
return (self.dv_index_path == other.dv_index_path and
self.offset == other.offset and
self.length == other.length and
self.cardinality == other.cardinality)
def __hash__(self):
return hash((self.dv_index_path, self.offset, self.length, self.cardinality))
def __str__(self):
return (f"DeletionFile(path='{self.dv_index_path}', offset={self.offset}, "
f"length={self.length}, cardinality={self.cardinality})")