filename = "calmos1976dvdripxvidavi upd"
print(extract_features(filename))

This could output:

{'title': 'calmos', 'year': '1976', 'source': 'dvdrip', 'codec': 'xvid', 'file_format': 'avi', 'update_status': 'yes'}

calmos1976dvdripxvidavi upd
def extract_features(filename):
    """Parse a release-style movie file name into its component tags.

    The name is expected to look like ``<title><year><source><codec><format>``
    with optional separators between the parts, e.g. the sample input
    ``calmos1976dvdripxvidavi upd``. Tag matching is case-insensitive and
    works whether or not the tags are separated from each other.

    Args:
        filename: The file name (or release name) to analyse.

    Returns:
        A dict with the keys:

        * ``title`` -- text preceding the year (or preceding ``dvdrip`` when
          no year is found), stripped of surrounding separators.
        * ``year`` -- the last standalone four-digit 19xx/20xx number that
          appears before the source tag, or ``None``.
        * ``source`` -- ``'dvdrip'`` when that tag is present, else ``None``.
        * ``codec`` -- ``'xvid'`` when that tag is present, else ``None``.
        * ``file_format`` -- ``'avi'`` when an avi marker is present, else
          ``None``.
        * ``update_status`` -- ``'yes'`` when ``upd`` occurs in the name,
          otherwise ``'no'``.

    Example:
        >>> extract_features("calmos1976dvdripxvidavi upd")["title"]
        'calmos'
        >>> extract_features("calmos1976dvdripxvidavi upd")["year"]
        '1976'
    """
    import re

    text = filename.strip()
    lowered = text.lower()

    # Everything before the source tag is the "head" holding title and year.
    # Search the original text (not a lower-cased copy) so the indices stay
    # valid even for characters whose lower-case form has a different length.
    source_match = re.search(r'dvdrip', text, re.IGNORECASE)
    head = text[:source_match.start()] if source_match else text

    # Take the LAST plausible year in the head so that titles which contain
    # a year-like number themselves ("2001 ... 1968") still parse correctly.
    # The look-arounds keep longer digit runs from being mistaken for a year.
    year_matches = list(re.finditer(r'(?<!\d)(?:19|20)\d{2}(?!\d)', head))
    if year_matches:
        last_year = year_matches[-1]
        year = last_year.group()
        title = head[:last_year.start()]
        tail_start = last_year.end()
    else:
        year = None
        title = head
        tail_start = len(head)

    # The tag section that follows the title/year; tags may be fused together
    # ("dvdripxvidavi"), so substring checks are used here instead of tokens.
    tail = text[tail_start:].lower()

    has_avi = (
        '.avi' in lowered
        or 'avi' in lowered.split()
        or 'avi' in tail
    )

    return {
        'title': title.strip(' \t\r\n._-'),
        'year': year,
        'source': 'dvdrip' if source_match else None,
        'codec': 'xvid' if 'xvid' in lowered else None,
        'file_format': 'avi' if has_avi else None,
        'update_status': 'yes' if 'upd' in lowered else 'no',
    }