def __init__(self, discovered_files: etl.file_sets.TableFileSet) -> None:
    """
    Set up the relation from the files that were discovered for it.

    The file set is kept on the instance. Bucket name and prefix are copied from
    it only when its scheme is "s3"; for any other scheme both are None.
    The manifest file name is always computed, and everything derived from the
    table design starts out as None.

    Args:
        discovered_files: file set whose ``scheme``, ``netloc`` and ``path`` are read here.
    """
    # Keep the file set first: self.source_path_name (defined outside this method) is read
    # further down and presumably depends on it -- keep this ordering.
    self._fileset = discovered_files

    # Only S3-backed file sets carry a bucket and a prefix.
    in_s3 = discovered_files.scheme == "s3"
    self.bucket_name = discovered_files.netloc if in_s3 else None
    self.prefix = discovered_files.path if in_s3 else None

    # Unlike TableFileSet, the manifest file name is always available here because it is
    # computed rather than discovered. A missing path is treated as an empty string.
    base_path = discovered_files.path or ""
    manifest_leaf = self.source_path_name + ".manifest"
    self.manifest_file_name = os.path.join(base_path, "data", manifest_leaf)

    # Caches for the table design, the query statement and values derived from the design;
    # all of them stay None until they are loaded.
    self._table_design = None  # type: Optional[Dict[str, Any]]
    self._query_stmt = None  # type: Optional[str]
    self._dependencies = None  # type: Optional[FrozenSet[str]]
    self._is_required = None  # type: Union[None, bool]
评论列表
文章目录