DaveM@0
|
1 {
|
DaveM@0
|
2 "cells": [
|
DaveM@0
|
3 {
|
DaveM@0
|
4 "cell_type": "code",
|
DaveM@0
|
5 "execution_count": 1,
|
DaveM@0
|
6 "metadata": {
|
DaveM@0
|
7 "collapsed": false
|
DaveM@0
|
8 },
|
DaveM@0
|
9 "outputs": [],
|
DaveM@0
|
10 "source": [
|
DaveM@0
|
11 "from matplotlib import pyplot as plt\n",
|
DaveM@0
|
12 "from scipy.cluster.hierarchy import dendrogram, linkage, cophenet\n",
|
DaveM@0
|
13 "from scipy.spatial.distance import pdist\n",
|
DaveM@1
|
14 "import sklearn \n", "from sklearn import cluster\n",
|
DaveM@0
|
15 "import numpy as np\n",
|
DaveM@0
|
16 "import csv\n",
|
DaveM@0
|
17 "\n",
|
DaveM@0
|
18 "# Directory and base name shared by every input file loaded below.\n", "dataFolder = '../data/'\n",
|
DaveM@0
|
19 "keyFile = 'AdobeNormalised'\n",
|
DaveM@0
|
20 "datapath = ''.join([dataFolder, keyFile])"
|
DaveM@0
|
21 ]
|
DaveM@0
|
22 },
|
DaveM@0
|
23 {
|
DaveM@0
|
24 "cell_type": "code",
|
DaveM@0
|
25 "execution_count": 2,
|
DaveM@0
|
26 "metadata": {
|
DaveM@0
|
27 "collapsed": true
|
DaveM@0
|
28 },
|
DaveM@0
|
29 "outputs": [],
|
DaveM@0
|
30 "source": [
|
DaveM@0
|
31 "X = np.genfromtxt(datapath + '.csv', delimiter=',', skip_header=1)\n",
|
DaveM@0
|
32 "filenames = np.loadtxt(datapath + '_filenames.csv', dtype=str)\n",
|
DaveM@0
|
33 "labels = np.loadtxt(datapath + '_labels.csv', dtype=str)\n",
|
DaveM@0
|
34 "features = np.loadtxt(datapath + '_features.csv', dtype=str)\n"
|
DaveM@0
|
35 ]
|
DaveM@0
|
36 },
|
DaveM@0
|
37 {
|
DaveM@0
|
38 "cell_type": "code",
|
DaveM@0
|
39 "execution_count": null,
|
DaveM@0
|
40 "metadata": {
|
DaveM@0
|
41 "collapsed": false
|
DaveM@0
|
42 },
|
DaveM@0
|
43 "outputs": [],
|
DaveM@0
|
44 "source": [
|
DaveM@1
|
45 "agglo = cluster.FeatureAgglomeration()\n",
|
DaveM@1
|
46 "# fit() hands back the fitted estimator, so transform() can be chained onto it\n",
|
DaveM@1
|
47 "X_reduced = agglo.fit(X).transform(X)"
|
DaveM@0
|
48 ]
|
DaveM@0
|
49 },
|
DaveM@0
|
50 {
|
DaveM@0
|
51 "cell_type": "code",
|
DaveM@0
|
52 "execution_count": null,
|
DaveM@0
|
53 "metadata": {
|
DaveM@0
|
54 "collapsed": false
|
DaveM@0
|
55 },
|
DaveM@0
|
56 "outputs": [],
|
DaveM@0
|
57 "source": [
|
DaveM@0
|
58 "Z = linkage(X, method='single', metric='euclidean')"
|
DaveM@0
|
59 ]
|
DaveM@0
|
60 },
|
DaveM@0
|
61 {
|
DaveM@0
|
62 "cell_type": "code",
|
DaveM@1
|
63 "execution_count": 18,
|
DaveM@1
|
64 "metadata": {
|
DaveM@1
|
65 "collapsed": false
|
DaveM@1
|
66 },
|
DaveM@1
|
67 "outputs": [
|
DaveM@1
|
68 {
|
DaveM@1
|
69 "name": "stdout",
|
DaveM@1
|
70 "output_type": "stream",
|
DaveM@1
|
71 "text": [
|
DaveM@1
|
72 "[[ 8.51810000e-01 4.00000000e-06 2.46000000e-04 ..., 2.10260000e-02\n",
|
DaveM@1
|
73 " 1.98220000e-02 1.04000000e-04]\n",
|
DaveM@1
|
74 " [ 9.52275000e-01 7.00000000e-06 1.82600000e-03 ..., 1.79490000e-02\n",
|
DaveM@1
|
75 " 1.09020000e-02 7.20000000e-05]\n",
|
DaveM@1
|
76 " [ 1.92200000e-03 1.00000000e-06 1.39000000e-04 ..., 2.35900000e-02\n",
|
DaveM@1
|
77 " 6.93800000e-03 2.61000000e-04]\n",
|
DaveM@1
|
78 " ..., \n",
|
DaveM@1
|
79 " [ 9.96346000e-01 3.37000000e-04 1.23600000e-03 ..., 5.24103000e-01\n",
|
DaveM@1
|
80 " 3.36967000e-01 5.39000000e-04]\n",
|
DaveM@1
|
81 " [ 9.99990000e-01 1.00000000e-06 0.00000000e+00 ..., 0.00000000e+00\n",
|
DaveM@1
|
82 " 0.00000000e+00 0.00000000e+00]\n",
|
DaveM@1
|
83 " [ 9.96624000e-01 6.97000000e-04 2.59300000e-03 ..., 5.24615000e-01\n",
|
DaveM@1
|
84 " 3.34985000e-01 5.45000000e-04]]\n"
|
DaveM@1
|
85 ]
|
DaveM@1
|
86 }
|
DaveM@1
|
87 ],
|
DaveM@1
|
88 "source": [
|
DaveM@1
|
89 "print(X)"
|
DaveM@1
|
90 ]
|
DaveM@1
|
91 },
|
DaveM@1
|
92 {
|
DaveM@1
|
93 "cell_type": "code",
|
DaveM@1
|
94 "execution_count": 29,
|
DaveM@1
|
95 "metadata": {
|
DaveM@1
|
96 "collapsed": false
|
DaveM@1
|
97 },
|
DaveM@1
|
98 "outputs": [
|
DaveM@1
|
99 {
|
DaveM@1
|
100 "name": "stdout",
|
DaveM@1
|
101 "output_type": "stream",
|
DaveM@1
|
102 "text": [
|
DaveM@1
|
103 "(8977, 1536)\n"
|
DaveM@1
|
104 ]
|
DaveM@1
|
105 }
|
DaveM@1
|
106 ],
|
DaveM@1
|
107 "source": []
|
DaveM@1
|
108 },
|
DaveM@1
|
109 {
|
DaveM@1
|
110 "cell_type": "code",
|
DaveM@1
|
111 "execution_count": 42,
|
DaveM@1
|
112 "metadata": {
|
DaveM@1
|
113 "collapsed": false
|
DaveM@1
|
114 },
|
DaveM@1
|
115 "outputs": [
|
DaveM@1
|
116 {
|
DaveM@1
|
117 "name": "stdout",
|
DaveM@1
|
118 "output_type": "stream",
|
DaveM@1
|
119 "text": [
|
DaveM@1
|
120 "{'nu_0': 0, 'kappa_0': 0, 'lambda_0': 0, 'mu_0': 0}\n"
|
DaveM@1
|
121 ]
|
DaveM@1
|
122 }
|
DaveM@1
|
123 ],
|
DaveM@1
|
124 "source": []
|
DaveM@1
|
125 },
|
DaveM@1
|
126 {
|
DaveM@1
|
127 "cell_type": "code",
|
DaveM@1
|
128 "execution_count": null,
|
DaveM@1
|
129 "metadata": {
|
DaveM@1
|
130 "collapsed": true
|
DaveM@1
|
131 },
|
DaveM@1
|
132 "outputs": [],
|
DaveM@1
|
133 "source": [
|
DaveM@1
|
134 "import pyBHC as bhc\n",
|
DaveM@1
|
135 "from pyBHC import dists\n",
|
DaveM@1
|
136 "\n",
|
DaveM@1
|
137 "# NOTE(review): mu_0, sigma_0 and S all receive empty lists here,\n",
|
DaveM@1
|
138 "# presumably as placeholders -- TODO confirm and supply real values.\n",
|
DaveM@1
|
139 "mu_init, sigma_init, S_init = [], [], []\n",
|
DaveM@1
|
140 "cd = dists.NormalFixedCovar(mu_0=mu_init, sigma_0=sigma_init, S=S_init)\n",
|
DaveM@1
|
141 "\n",
|
DaveM@1
|
142 "# temp = cd.log_marginal_likelihood(X)\n",
|
DaveM@1
|
143 "d = bhc.rbhc(X, cd)"
|
DaveM@1
|
144 ]
|
DaveM@1
|
145 },
|
DaveM@1
|
146 {
|
DaveM@1
|
147 "cell_type": "code",
|
DaveM@1
|
148 "execution_count": null,
|
DaveM@1
|
149 "metadata": {
|
DaveM@1
|
150 "collapsed": true
|
DaveM@1
|
151 },
|
DaveM@1
|
152 "outputs": [],
|
DaveM@1
|
153 "source": [
|
DaveM@1
|
154 "\n",
|
DaveM@1
|
155 "\n"
|
DaveM@1
|
156 ]
|
DaveM@1
|
157 },
|
DaveM@1
|
158 {
|
DaveM@1
|
159 "cell_type": "code",
|
DaveM@1
|
160 "execution_count": null,
|
DaveM@1
|
161 "metadata": {
|
DaveM@1
|
162 "collapsed": true
|
DaveM@1
|
163 },
|
DaveM@1
|
164 "outputs": [],
|
DaveM@1
|
165 "source": []
|
DaveM@1
|
166 },
|
DaveM@1
|
167 {
|
DaveM@1
|
168 "cell_type": "code",
|
DaveM@1
|
169 "execution_count": null,
|
DaveM@1
|
170 "metadata": {
|
DaveM@1
|
171 "collapsed": true
|
DaveM@1
|
172 },
|
DaveM@1
|
173 "outputs": [],
|
DaveM@1
|
174 "source": []
|
DaveM@1
|
175 },
|
DaveM@1
|
176 {
|
DaveM@1
|
177 "cell_type": "code",
|
DaveM@0
|
178 "execution_count": null,
|
DaveM@0
|
179 "metadata": {
|
DaveM@0
|
180 "collapsed": true
|
DaveM@0
|
181 },
|
DaveM@0
|
182 "outputs": [],
|
DaveM@0
|
183 "source": []
|
DaveM@0
|
184 }
|
DaveM@0
|
185 ],
|
DaveM@0
|
186 "metadata": {
|
DaveM@0
|
187 "kernelspec": {
|
DaveM@0
|
188 "display_name": "Python 2",
|
DaveM@0
|
189 "language": "python",
|
DaveM@0
|
190 "name": "python2"
|
DaveM@0
|
191 },
|
DaveM@0
|
192 "language_info": {
|
DaveM@0
|
193 "codemirror_mode": {
|
DaveM@0
|
194 "name": "ipython",
|
DaveM@0
|
195 "version": 2
|
DaveM@0
|
196 },
|
DaveM@0
|
197 "file_extension": ".py",
|
DaveM@0
|
198 "mimetype": "text/x-python",
|
DaveM@0
|
199 "name": "python",
|
DaveM@0
|
200 "nbconvert_exporter": "python",
|
DaveM@0
|
201 "pygments_lexer": "ipython2",
|
DaveM@0
|
202 "version": "2.7.10"
|
DaveM@0
|
203 }
|
DaveM@0
|
204 },
|
DaveM@0
|
205 "nbformat": 4,
|
DaveM@0
|
206 "nbformat_minor": 0
|
DaveM@0
|
207 }
|