"""Fit a MultiLabelBinarizer on the known GO terms and persist it with joblib.

Reads ``data/processed/go_terms.json``, takes the keys of its ``go_to_idx``
mapping as the label vocabulary, fits a ``MultiLabelBinarizer`` on that
vocabulary, and writes the fitted binarizer to ``mlb_public_v1.pkl`` in the
current working directory.
"""

import json

import joblib
from sklearn.preprocessing import MultiLabelBinarizer

# JSON is UTF-8 by specification; pin the encoding so decoding does not
# depend on the platform's locale default.
with open("data/processed/go_terms.json", encoding="utf-8") as f:
    go_data = json.load(f)

# A single "sample" containing every key of go_to_idx, so the binarizer
# learns the full label vocabulary in one fit call.
mlb = MultiLabelBinarizer()
mlb.fit([list(go_data["go_to_idx"])])
# NOTE(review): without an explicit `classes=` argument the binarizer orders
# its output columns by sorted label, which may differ from the indices
# stored in go_to_idx -- confirm downstream code does not assume they match.

joblib.dump(mlb, "mlb_public_v1.pkl")