1021 add flexible attr control

This commit is contained in:
FelixChan
2025-10-21 15:27:03 +08:00
parent d6b68ef90b
commit b493ede479
15 changed files with 400 additions and 394 deletions

View File

@@ -61,7 +61,7 @@ class Corpus2Event():
# remove the corpus files that are already in the out_dir
# Use set for faster existence checks
existing_files = set(f.name for f in self.out_dir.glob("*.pkl"))
# corpus_list = [corpus for corpus in corpus_list if corpus.name not in existing_files]
corpus_list = [corpus for corpus in corpus_list if corpus.name not in existing_files]
for filepath_name, event in tqdm(map(self._load_single_corpus_and_make_event, corpus_list), total=len(corpus_list)):
if event is None:
broken_count += 1