plosone_underreview: tests/test_outliers.py comparison

return train/test sets in load_dataset

author	Maria Panteli <m.x.panteli@gmail.com>
date	Wed, 13 Sep 2017 12:53:57 +0100
parents	ed109218dd4b
children	e8084526f7e5

comparison

Legend: equal | deleted | inserted | replaced

-:0bba6f63f4fd
+:65b9330afdd8
 import pytest
 import numpy as np
 import pandas as pd
+import pickle
+import os
 import scripts.outliers as outliers
 def test_country_outlier_df():
 outlier_counts_true = {'a':.5, 'b':1.}
 assert np.array_equal(outlier_counts, outlier_counts_true)
 def test_get_outliers_df():
-assert True
+np.random.seed(1)
+X = np.random.randn(100, 3)
+# create outliers by shifting the entries of the last 5 samples
+X[-5:, :] = X[-5:, :] + 10
+Y = np.concatenate([np.repeat('a', 95), np.repeat('b', 5)])
+df, threshold, MD = outliers.get_outliers_df(X, Y)
+# expect that items from country 'b' are detected as outliers
+assert np.array_equal(df['Outliers'].get_values(), np.array([0., 1.0]))

Mercurial > hg > plosone_underreview