changeset 103:7a8d043d2d45 branch-tests

more on metadata for public code
author Maria Panteli
date Thu, 05 Oct 2017 11:47:26 +0100
parents d6c937bc1531
children 2f6e687938e2
files scripts/add_collection.py
diffstat 1 files changed, 21 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/scripts/add_collection.py	Thu Oct 05 11:47:26 2017 +0100
@@ -0,0 +1,21 @@
+import numpy as np
+import pandas as pd
+import pickle 
+import os
+
+
+METADATA_FILE = '../../music-outliers/data/metadata.csv'
+#METADATA_FILE = '../data/metadata.csv'
+
+df = pd.read_csv(METADATA_FILE)
+
+collection = []
+for audio in df['Audio']:
+    if 'SampleAudio' in audio:
+        collection.append('Smithsonian Folkways')
+    else:
+        collection.append('British Library')
+collection = np.array(collection)
+df['Collection'] = collection
+
+df.to_csv('../../music-outliers/data/metadata_2.csv', index=False)