Fixes 4 and 10: CSVs are now sorted, and the origin of a duplication is always the local instance when compared

This commit is contained in:
doctor_dev 2025-06-10 22:07:56 +00:00
parent 50f6a637cd
commit d78ed2bc86
No known key found for this signature in database
GPG key ID: F12F7F71CB84AEAA
5 changed files with 43 additions and 15 deletions

View file

@@ -69,6 +69,8 @@ def clean_csv(df, blacklist):
try:
if not df.empty:
df = utils.sort_instances(df, 'Instance', conf.LOCAL_INSTANCE)
df = utils.remove_duplications(df)
df = df[~df.apply(lambda row: any(word in str(value) for word in blacklist for value in row), axis=1)]