Mercurial > hg > from-my-pen-to-your-ears-supplementary-material
view results/data/saves/.ipynb_checkpoints/Untitled-checkpoint.ipynb @ 1:eb3b846ae0ef tip
second commit
author | Emmanouil Theofanis Chourdakis <e.t.chourdakis@qmul.ac.uk> |
---|---|
date | Wed, 16 May 2018 18:13:41 +0100 |
parents | 4dad87badb0c |
children |
line wrap: on
line source
{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [
"import glob\n",
"import pandas as pd\n",
"import matplotlib.pyplot as plt\n",
"import seaborn as sns\n",
"sns.set(style=\"ticks\", color_codes=True, font_scale=1.3)\n",
"\n",
"\n",
"def load_page_ratings(page_number):\n",
"    \"\"\"Read the ratings CSV of one page and index it by its 'file_keys' column.\n",
"\n",
"    page_number selects the file 'ratings/page<page_number>-default-ratings.csv'.\n",
"    \"\"\"\n",
"    csv_path = 'ratings/page{}-default-ratings.csv'.format(page_number)\n",
"    return pd.read_csv(csv_path).set_index('file_keys')\n",
"\n",
"\n",
"page1_df = load_page_ratings(1)\n",
"page2_df = load_page_ratings(2)\n",
"page3_df = load_page_ratings(3)\n",
"page4_df = load_page_ratings(4)\n",
"page5_df = load_page_ratings(5)\n",
"page6_df = load_page_ratings(6)\n",
"page7_df = load_page_ratings(7)\n",
"page8_df = load_page_ratings(8)\n",
"page9_df = load_page_ratings(9)"
] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [
"def label_story(page_df, story):\n",
"    \"\"\"Return a renamed copy of page_df tagged with its story.\n",
"\n",
"    The first character of every column name is dropped and a constant\n",
"    'story' column holding `story` is added. page_df itself is not modified.\n",
"    \"\"\"\n",
"    labelled = page_df.rename(columns=lambda name: name[1:])\n",
"    labelled['story'] = story\n",
"    return labelled\n",
"\n",
"\n",
"# Stories are assigned to consecutive pages in the repeating order a, b, c.\n",
"page1 = label_story(page1_df, 'a')\n",
"page2 = label_story(page2_df, 'b')\n",
"page3 = label_story(page3_df, 'c')\n",
"page4 = label_story(page4_df, 'a')\n",
"page5 = label_story(page5_df, 'b')\n",
"page6 = label_story(page6_df, 'c')\n",
"page7 = label_story(page7_df, 'a')\n",
"page8 = label_story(page8_df, 'b')\n",
"page9 = label_story(page9_df, 'c')\n"
] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "<div>\n", "<style scoped>\n", " .dataframe tbody tr th:only-of-type {\n", " vertical-align: middle;\n", " }\n", "\n", " .dataframe tbody tr th {\n", " vertical-align: top;\n", " }\n", "\n", " .dataframe thead th {\n", " text-align: right;\n", " }\n", "</style>\n", "<table border=\"1\" class=\"dataframe\">\n", " <thead>\n", " <tr style=\"text-align: right;\">\n", " <th></th>\n", " <th>0000</th>\n", " <th>0011</th>\n", " <th>1011</th>\n", " <th>1101</th>\n", " <th>1110</th>\n", " <th>1111</th>\n", " <th>story</th>\n", " </tr>\n", " <tr>\n", " <th>file_keys</th>\n", " <th></th>\n", " <th></th>\n", " <th></th>\n", " <th></th>\n", " <th></th>\n", " <th></th>\n", " <th></th>\n", " </tr>\n", " </thead>\n", " <tbody>\n", " <tr>\n", " <th>IXHrDvdwYoDCO7bvwRMB7jD46hoWAjDi</th>\n", " <td>0.06</td>\n", " <td>0.13</td>\n", " <td>0.68</td>\n", " <td>0.71</td>\n", " <td>0.65</td>\n", " <td>0.65</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>iWogwaa7GooHWHcp8C0ZjRrTMDgcae0t</th>\n", " <td>0.00</td>\n", " <td>0.04</td>\n", " <td>0.95</td>\n", " <td>1.00</td>\n", " <td>0.80</td>\n", " <td>0.95</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>bOyRMU1QCcMqMpcjcHNBuVMF45oksQMD</th>\n", " <td>0.24</td>\n", " <td>0.24</td>\n", " <td>0.76</td>\n", " <td>0.75</td>\n", " <td>1.00</td>\n", " <td>0.76</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>U6mgdJX1DgAfYJ6DR7sKY0CL4YgcwZKq</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>0.83</td>\n", " <td>0.97</td>\n", " <td>0.86</td>\n", " <td>0.90</td>\n", " <td>a</td>\n", " </tr>\n", " 
<tr>\n", " <th>9UODgpqx7pTDhiiLm7ds39wh59aYBrHK</th>\n", " <td>0.06</td>\n", " <td>0.20</td>\n", " <td>0.72</td>\n", " <td>0.77</td>\n", " <td>0.55</td>\n", " <td>0.91</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>VyX492RQzqQXRL84PByL9pLt8C5p4c50</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>0.63</td>\n", " <td>0.87</td>\n", " <td>0.84</td>\n", " <td>1.00</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>bkHwhN78d7k2kIanOievgityZQD7gVOr</th>\n", " <td>0.08</td>\n", " <td>0.25</td>\n", " <td>0.93</td>\n", " <td>0.98</td>\n", " <td>0.78</td>\n", " <td>0.92</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>bKhIcFzfZ3YXPxNiw4E7kFyoTFAqeFTp</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>1.00</td>\n", " <td>0.76</td>\n", " <td>1.00</td>\n", " <td>0.77</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>ufohn9b31ZNI2zLGNqmmRYOMtIwiw6o1</th>\n", " <td>0.09</td>\n", " <td>0.10</td>\n", " <td>0.92</td>\n", " <td>0.91</td>\n", " <td>0.09</td>\n", " <td>0.92</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>fZGbsBmuEtrB35G2IzQu0IxOCVoljWpz</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>0.97</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>YMVW8vVq8kZbGFRMWn9ElJBJ38bVV5GU</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>0.95</td>\n", " <td>0.42</td>\n", " <td>0.92</td>\n", " <td>0.93</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>G2WO7k3tSjvBrlMG1Nqz4DsKBO8oaEcQ</th>\n", " <td>0.00</td>\n", " <td>0.14</td>\n", " <td>0.70</td>\n", " <td>0.54</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>OK2yLWD54tr3klqiS631VXjQlroZfmD3</th>\n", " <td>0.06</td>\n", " <td>0.03</td>\n", " <td>0.52</td>\n", " <td>1.00</td>\n", " <td>0.68</td>\n", " <td>0.89</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>t1Ybl1O1EAdpBEbxOLbaU4QlHtAcGCxa</th>\n", " <td>0.09</td>\n", " <td>0.11</td>\n", " <td>1.00</td>\n", " 
<td>0.99</td>\n", " <td>0.65</td>\n", " <td>0.54</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>JZaBaWCeuGjSAyoUrfwdASaIHXkHCZml</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>0.71</td>\n", " <td>0.83</td>\n", " <td>0.84</td>\n", " <td>0.93</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>uoBPmOWdbNI4uowtBZRZK8BIEUVvUn1o</th>\n", " <td>0.23</td>\n", " <td>0.23</td>\n", " <td>0.62</td>\n", " <td>1.00</td>\n", " <td>0.79</td>\n", " <td>0.84</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>lIOWKvmCLdlUhGFYwE3lOfizSeqtxyNT</th>\n", " <td>0.11</td>\n", " <td>0.24</td>\n", " <td>0.69</td>\n", " <td>1.00</td>\n", " <td>0.66</td>\n", " <td>0.83</td>\n", " <td>a</td>\n", " </tr>\n", " <tr>\n", " <th>IXHrDvdwYoDCO7bvwRMB7jD46hoWAjDi</th>\n", " <td>0.01</td>\n", " <td>0.02</td>\n", " <td>0.70</td>\n", " <td>0.68</td>\n", " <td>0.79</td>\n", " <td>0.75</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>iWogwaa7GooHWHcp8C0ZjRrTMDgcae0t</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>bOyRMU1QCcMqMpcjcHNBuVMF45oksQMD</th>\n", " <td>0.00</td>\n", " <td>0.24</td>\n", " <td>0.76</td>\n", " <td>0.76</td>\n", " <td>0.76</td>\n", " <td>1.00</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>U6mgdJX1DgAfYJ6DR7sKY0CL4YgcwZKq</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>0.96</td>\n", " <td>0.91</td>\n", " <td>0.92</td>\n", " <td>0.92</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>9UODgpqx7pTDhiiLm7ds39wh59aYBrHK</th>\n", " <td>0.20</td>\n", " <td>0.29</td>\n", " <td>0.60</td>\n", " <td>0.96</td>\n", " <td>0.70</td>\n", " <td>0.81</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>VyX492RQzqQXRL84PByL9pLt8C5p4c50</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>0.81</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " 
<th>bKhIcFzfZ3YXPxNiw4E7kFyoTFAqeFTp</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>1.00</td>\n", " <td>0.75</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>ufohn9b31ZNI2zLGNqmmRYOMtIwiw6o1</th>\n", " <td>0.13</td>\n", " <td>0.08</td>\n", " <td>0.86</td>\n", " <td>0.95</td>\n", " <td>0.74</td>\n", " <td>0.76</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>fZGbsBmuEtrB35G2IzQu0IxOCVoljWpz</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>0.97</td>\n", " <td>0.99</td>\n", " <td>1.00</td>\n", " <td>0.61</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>G2WO7k3tSjvBrlMG1Nqz4DsKBO8oaEcQ</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>0.49</td>\n", " <td>1.00</td>\n", " <td>0.65</td>\n", " <td>0.82</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>OK2yLWD54tr3klqiS631VXjQlroZfmD3</th>\n", " <td>0.00</td>\n", " <td>0.03</td>\n", " <td>0.95</td>\n", " <td>1.00</td>\n", " <td>0.83</td>\n", " <td>0.83</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>t1Ybl1O1EAdpBEbxOLbaU4QlHtAcGCxa</th>\n", " <td>0.00</td>\n", " <td>0.15</td>\n", " <td>0.48</td>\n", " <td>0.76</td>\n", " <td>0.74</td>\n", " <td>0.87</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>D0Fq5YbSHwHaHK9V5pIWlIg5T6Ji3fQH</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>0.98</td>\n", " <td>0.74</td>\n", " <td>0.92</td>\n", " <td>0.91</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>uoBPmOWdbNI4uowtBZRZK8BIEUVvUn1o</th>\n", " <td>0.09</td>\n", " <td>0.10</td>\n", " <td>0.77</td>\n", " <td>1.00</td>\n", " <td>0.90</td>\n", " <td>1.00</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>lIOWKvmCLdlUhGFYwE3lOfizSeqtxyNT</th>\n", " <td>0.12</td>\n", " <td>0.11</td>\n", " <td>0.77</td>\n", " <td>0.92</td>\n", " <td>1.00</td>\n", " <td>0.90</td>\n", " <td>b</td>\n", " </tr>\n", " <tr>\n", " <th>IXHrDvdwYoDCO7bvwRMB7jD46hoWAjDi</th>\n", " <td>0.02</td>\n", " <td>0.01</td>\n", " <td>0.87</td>\n", " <td>0.98</td>\n", " 
<td>0.87</td>\n", " <td>0.93</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>iWogwaa7GooHWHcp8C0ZjRrTMDgcae0t</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>0.97</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>bOyRMU1QCcMqMpcjcHNBuVMF45oksQMD</th>\n", " <td>0.00</td>\n", " <td>0.24</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>U6mgdJX1DgAfYJ6DR7sKY0CL4YgcwZKq</th>\n", " <td>0.00</td>\n", " <td>0.00</td>\n", " <td>0.72</td>\n", " <td>0.85</td>\n", " <td>0.88</td>\n", " <td>0.66</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>VyX492RQzqQXRL84PByL9pLt8C5p4c50</th>\n", " <td>0.02</td>\n", " <td>0.00</td>\n", " <td>0.93</td>\n", " <td>0.82</td>\n", " <td>0.97</td>\n", " <td>0.83</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>bkHwhN78d7k2kIanOievgityZQD7gVOr</th>\n", " <td>0.18</td>\n", " <td>0.23</td>\n", " <td>0.89</td>\n", " <td>0.92</td>\n", " <td>0.95</td>\n", " <td>0.90</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>ufohn9b31ZNI2zLGNqmmRYOMtIwiw6o1</th>\n", " <td>0.07</td>\n", " <td>0.11</td>\n", " <td>0.77</td>\n", " <td>0.93</td>\n", " <td>0.87</td>\n", " <td>0.93</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>fZGbsBmuEtrB35G2IzQu0IxOCVoljWpz</th>\n", " <td>0.01</td>\n", " <td>0.00</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>0.97</td>\n", " <td>0.75</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>G2WO7k3tSjvBrlMG1Nqz4DsKBO8oaEcQ</th>\n", " <td>0.20</td>\n", " <td>0.20</td>\n", " <td>0.60</td>\n", " <td>1.00</td>\n", " <td>1.00</td>\n", " <td>0.75</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>OK2yLWD54tr3klqiS631VXjQlroZfmD3</th>\n", " <td>0.00</td>\n", " <td>0.07</td>\n", " <td>0.91</td>\n", " <td>0.97</td>\n", " <td>0.84</td>\n", " <td>0.73</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>D0Fq5YbSHwHaHK9V5pIWlIg5T6Ji3fQH</th>\n", " 
<td>0.10</td>\n", " <td>0.29</td>\n", " <td>0.51</td>\n", " <td>0.95</td>\n", " <td>0.52</td>\n", " <td>0.87</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>KBKzd0PezF8bsGoEZTkVkpmj1o8OECIo</th>\n", " <td>0.12</td>\n", " <td>0.66</td>\n", " <td>0.28</td>\n", " <td>0.05</td>\n", " <td>0.54</td>\n", " <td>0.44</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>uoBPmOWdbNI4uowtBZRZK8BIEUVvUn1o</th>\n", " <td>0.12</td>\n", " <td>0.14</td>\n", " <td>0.77</td>\n", " <td>1.00</td>\n", " <td>0.95</td>\n", " <td>0.97</td>\n", " <td>c</td>\n", " </tr>\n", " <tr>\n", " <th>lIOWKvmCLdlUhGFYwE3lOfizSeqtxyNT</th>\n", " <td>0.24</td>\n", " <td>0.12</td>\n", " <td>0.89</td>\n", " <td>0.82</td>\n", " <td>0.69</td>\n", " <td>0.90</td>\n", " <td>c</td>\n", " </tr>\n", " </tbody>\n", "</table>\n", "</div>" ], "text/plain": [ " 0000 0011 1011 1101 1110 1111 story\n", "file_keys \n", "IXHrDvdwYoDCO7bvwRMB7jD46hoWAjDi 0.06 0.13 0.68 0.71 0.65 0.65 a\n", "iWogwaa7GooHWHcp8C0ZjRrTMDgcae0t 0.00 0.04 0.95 1.00 0.80 0.95 a\n", "bOyRMU1QCcMqMpcjcHNBuVMF45oksQMD 0.24 0.24 0.76 0.75 1.00 0.76 a\n", "U6mgdJX1DgAfYJ6DR7sKY0CL4YgcwZKq 0.00 0.00 0.83 0.97 0.86 0.90 a\n", "9UODgpqx7pTDhiiLm7ds39wh59aYBrHK 0.06 0.20 0.72 0.77 0.55 0.91 a\n", "VyX492RQzqQXRL84PByL9pLt8C5p4c50 0.00 0.00 0.63 0.87 0.84 1.00 a\n", "bkHwhN78d7k2kIanOievgityZQD7gVOr 0.08 0.25 0.93 0.98 0.78 0.92 a\n", "bKhIcFzfZ3YXPxNiw4E7kFyoTFAqeFTp 0.00 0.00 1.00 0.76 1.00 0.77 a\n", "ufohn9b31ZNI2zLGNqmmRYOMtIwiw6o1 0.09 0.10 0.92 0.91 0.09 0.92 a\n", "fZGbsBmuEtrB35G2IzQu0IxOCVoljWpz 0.00 0.00 1.00 1.00 1.00 0.97 a\n", "YMVW8vVq8kZbGFRMWn9ElJBJ38bVV5GU 0.00 0.00 0.95 0.42 0.92 0.93 a\n", "G2WO7k3tSjvBrlMG1Nqz4DsKBO8oaEcQ 0.00 0.14 0.70 0.54 1.00 1.00 a\n", "OK2yLWD54tr3klqiS631VXjQlroZfmD3 0.06 0.03 0.52 1.00 0.68 0.89 a\n", "t1Ybl1O1EAdpBEbxOLbaU4QlHtAcGCxa 0.09 0.11 1.00 0.99 0.65 0.54 a\n", "JZaBaWCeuGjSAyoUrfwdASaIHXkHCZml 0.00 0.00 0.71 0.83 0.84 0.93 a\n", "uoBPmOWdbNI4uowtBZRZK8BIEUVvUn1o 0.23 0.23 0.62 1.00 0.79 0.84 
a\n", "lIOWKvmCLdlUhGFYwE3lOfizSeqtxyNT 0.11 0.24 0.69 1.00 0.66 0.83 a\n", "IXHrDvdwYoDCO7bvwRMB7jD46hoWAjDi 0.01 0.02 0.70 0.68 0.79 0.75 b\n", "iWogwaa7GooHWHcp8C0ZjRrTMDgcae0t 0.00 0.00 1.00 1.00 1.00 1.00 b\n", "bOyRMU1QCcMqMpcjcHNBuVMF45oksQMD 0.00 0.24 0.76 0.76 0.76 1.00 b\n", "U6mgdJX1DgAfYJ6DR7sKY0CL4YgcwZKq 0.00 0.00 0.96 0.91 0.92 0.92 b\n", "9UODgpqx7pTDhiiLm7ds39wh59aYBrHK 0.20 0.29 0.60 0.96 0.70 0.81 b\n", "VyX492RQzqQXRL84PByL9pLt8C5p4c50 0.00 0.00 1.00 1.00 1.00 0.81 b\n", "bKhIcFzfZ3YXPxNiw4E7kFyoTFAqeFTp 0.00 0.00 1.00 0.75 1.00 1.00 b\n", "ufohn9b31ZNI2zLGNqmmRYOMtIwiw6o1 0.13 0.08 0.86 0.95 0.74 0.76 b\n", "fZGbsBmuEtrB35G2IzQu0IxOCVoljWpz 0.00 0.00 0.97 0.99 1.00 0.61 b\n", "G2WO7k3tSjvBrlMG1Nqz4DsKBO8oaEcQ 0.00 0.00 0.49 1.00 0.65 0.82 b\n", "OK2yLWD54tr3klqiS631VXjQlroZfmD3 0.00 0.03 0.95 1.00 0.83 0.83 b\n", "t1Ybl1O1EAdpBEbxOLbaU4QlHtAcGCxa 0.00 0.15 0.48 0.76 0.74 0.87 b\n", "D0Fq5YbSHwHaHK9V5pIWlIg5T6Ji3fQH 0.00 0.00 0.98 0.74 0.92 0.91 b\n", "uoBPmOWdbNI4uowtBZRZK8BIEUVvUn1o 0.09 0.10 0.77 1.00 0.90 1.00 b\n", "lIOWKvmCLdlUhGFYwE3lOfizSeqtxyNT 0.12 0.11 0.77 0.92 1.00 0.90 b\n", "IXHrDvdwYoDCO7bvwRMB7jD46hoWAjDi 0.02 0.01 0.87 0.98 0.87 0.93 c\n", "iWogwaa7GooHWHcp8C0ZjRrTMDgcae0t 0.00 0.00 0.97 1.00 1.00 1.00 c\n", "bOyRMU1QCcMqMpcjcHNBuVMF45oksQMD 0.00 0.24 1.00 1.00 1.00 1.00 c\n", "U6mgdJX1DgAfYJ6DR7sKY0CL4YgcwZKq 0.00 0.00 0.72 0.85 0.88 0.66 c\n", "VyX492RQzqQXRL84PByL9pLt8C5p4c50 0.02 0.00 0.93 0.82 0.97 0.83 c\n", "bkHwhN78d7k2kIanOievgityZQD7gVOr 0.18 0.23 0.89 0.92 0.95 0.90 c\n", "ufohn9b31ZNI2zLGNqmmRYOMtIwiw6o1 0.07 0.11 0.77 0.93 0.87 0.93 c\n", "fZGbsBmuEtrB35G2IzQu0IxOCVoljWpz 0.01 0.00 1.00 1.00 0.97 0.75 c\n", "G2WO7k3tSjvBrlMG1Nqz4DsKBO8oaEcQ 0.20 0.20 0.60 1.00 1.00 0.75 c\n", "OK2yLWD54tr3klqiS631VXjQlroZfmD3 0.00 0.07 0.91 0.97 0.84 0.73 c\n", "D0Fq5YbSHwHaHK9V5pIWlIg5T6Ji3fQH 0.10 0.29 0.51 0.95 0.52 0.87 c\n", "KBKzd0PezF8bsGoEZTkVkpmj1o8OECIo 0.12 0.66 0.28 0.05 0.54 0.44 c\n", "uoBPmOWdbNI4uowtBZRZK8BIEUVvUn1o 
0.12 0.14 0.77 1.00 0.95 0.97 c\n", "lIOWKvmCLdlUhGFYwE3lOfizSeqtxyNT 0.24 0.12 0.89 0.82 0.69 0.90 c" ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [
"# DataFrame.append was removed in pandas 2.0; pd.concat stacks the pages the same way.\n",
"task1_df = pd.concat([page1, page2, page3])\n",
"task2_df = pd.concat([page4, page5, page6])\n",
"task3_df = pd.concat([page7, page8, page9])\n",
"\n",
"\n",
"def transform_df(df):\n",
"    \"\"\"Reshape a wide ratings frame into long form, one row per rating.\n",
"\n",
"    Every column other than 'file_keys' and 'story' is treated as a stimulus.\n",
"    The result has the columns 'stimulus' (the source column name), 'story'\n",
"    (copied from the input row) and 'preference' (the cell value). Rows are\n",
"    ordered input row by input row and, within a row, in column order.\n",
"    \"\"\"\n",
"    stimuli = [c for c in df.columns if c not in ['file_keys', 'story']]\n",
"    return pd.DataFrame({\n",
"        # The stimulus names cycle once per input row ...\n",
"        'stimulus': stimuli * len(df),\n",
"        # ... while each row's story label is repeated once per stimulus.\n",
"        'story': df['story'].repeat(len(stimuli)).values,\n",
"        # Row-major flattening lines the values up with the two columns above.\n",
"        'preference': df[stimuli].values.ravel(),\n",
"    }, columns=['stimulus', 'story', 'preference'])\n",
"\n",
"\n",
"task1_df"
] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [], "source": [ "task1_transformed = transform_df(task1_df)\n", "task2_transformed = transform_df(task2_df)\n", "task3_transformed = transform_df(task3_df)" ] }, { "cell_type": "code", "execution_count": 5, "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "<matplotlib.figure.Figure at 0x7f8053549c18>" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "fig, axes = plt.subplots(nrows=4, ncols=4)" ] }, { "cell_type": "code", "execution_count": 6, "metadata": {}, "outputs": [], "source": [
"from matplotlib import gridspec\n",
"\n",
"# Box colour of each story in the per-story (upper) panel.\n",
"STORY_PALETTE = {'a': 'red', 'b': 'yellow', 'c': 'cyan'}\n",
"\n",
"\n",
"def plot_task(ratings, hide_yaxis=False):\n",
"    \"\"\"Draw the two-panel box-plot figure for one task.\n",
"\n",
"    The upper panel shows 'preference' per 'stimulus' split by 'story'; the\n",
"    lower panel pools all stories and paints its boxes magenta.\n",
"\n",
"    Parameters\n",
"    ----------\n",
"    ratings : DataFrame with 'stimulus', 'story' and 'preference' columns.\n",
"    hide_yaxis : if True, remove the y ticks, tick labels and axis label\n",
"        from both panels.\n",
"\n",
"    Returns\n",
"    -------\n",
"    (fig, top_ax, bottom_ax) so the caller can adjust and save the figure.\n",
"    \"\"\"\n",
"    fig = plt.figure(figsize=(5, 5))\n",
"    grid = gridspec.GridSpec(2, 1, height_ratios=[2, 1])\n",
"\n",
"    top_ax = fig.add_subplot(grid[0])\n",
"    sns.boxplot(data=ratings, x='stimulus', y='preference', hue='story', width=0.8, palette=STORY_PALETTE, ax=top_ax)\n",
"    top_ax.set_ylabel('individual')\n",
"    top_ax.set(xticklabels=[], xlabel='')\n",
"    top_ax.set_xticks([])\n",
"\n",
"    bottom_ax = fig.add_subplot(grid[1])\n",
"    sns.boxplot(data=ratings, x='stimulus', y='preference', width=0.6, palette='gray', ax=bottom_ax)\n",
"    bottom_ax.set_ylabel('aggregate')\n",
"    # Matplotlib < 3.5 stores the box patches in ax.artists, newer releases in\n",
"    # ax.patches; recolour whichever of the two holds them.\n",
"    for box in list(bottom_ax.artists) + list(bottom_ax.patches):\n",
"        box.set_facecolor('magenta')\n",
"\n",
"    if hide_yaxis:\n",
"        for ax in (top_ax, bottom_ax):\n",
"            ax.set(yticklabels=[], ylabel='')\n",
"            ax.set_yticks([])\n",
"\n",
"    return fig, top_ax, bottom_ax"
] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "<matplotlib.figure.Figure at 0x7f80511c4208>" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [
"fig, top_ax, bottom_ax = plot_task(task1_transformed)\n",
"fig.tight_layout()\n",
"fig.savefig('task1.pdf', dpi=300, bbox_inches='tight')"
] }, { "cell_type": "code", "execution_count": 8, "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "<matplotlib.figure.Figure at 0x7f8050e212e8>" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [
"fig, top_ax, bottom_ax = plot_task(task2_transformed, hide_yaxis=True)\n",
"# NOTE(review): this changes a global default after this figure's legend already\n",
"# exists, so it appears to affect only figures drawn later - confirm that is intended.\n",
"sns.set_style({'legend.frameon':False})\n",
"fig.tight_layout()\n",
"fig.savefig('task2.pdf', dpi=300, bbox_inches='tight')"
] }, { "cell_type": "code", "execution_count": 9, "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "<matplotlib.figure.Figure at 0x7f8050e93198>" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [
"fig, top_ax, bottom_ax = plot_task(task3_transformed, hide_yaxis=True)\n",
"# Kept from the original cell; presumably meant to suppress a legend on the\n",
"# pooled panel - TODO confirm it is still needed.\n",
"bottom_ax.legend('')\n",
"fig.tight_layout()\n",
"fig.savefig('task3.pdf', dpi=300, bbox_inches='tight')"
] }, { "cell_type": "code", "execution_count": 10, "metadata": {}, "outputs": [ { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAhAAAABQCAYAAABIx0zMAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDIuMS4yLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvNQv5yAAAAzdJREFUeJzt3b+KXGUcxvHfOInbLKx/smAwjRg8RWwtU1jZ2QreQcBCryCxsLDzEmwXwcZbSJcrOKCkiVioMcssMWtcj412GuYZ9/XNOfv5VFvMC88LO/CFc2BW0zQVAEDihd4DAID5ERAAQExAAAAxAQEAxAQEABATEABATEAAADEBAQDEBAQAEBMQAEDsUnpgGIa9qnqnqn6oqrNzXwQA/J/WVXW1qu6N43i67aFnBsQwDHeq6vZ/2wUAzMDNqrq77YdX6Y9pDcPwZlV9+8XjX+twoT/EdeuDz3tPaOrKjS97T2jq3a/e7z2hmQ9vfNJ7QlPTx2/3ntDUNx897j2hqffe+qz3hKa+Przfe0ITm82mjo6Oqqquj+P43bbn4kcY9ddji8NpqtcWGhDr/Vd7T2jq8iuXe09o6uDFl3pPaOba/u+9JzQ1XVv2a1kv7616T2jq9f0rvSc0dXDwsPeE1qLXEpb9bQUAmhAQAEBMQAAAMQEBAMQEBAAQExAAQExAAAAxAQEAxAQEABATEABATEAAADEBAQDEBAQAEBMQAEBMQAAAMQEBAMQEBAAQExAAQExAAAAxAQEAxAQEABATEABATEAAADEBAQDEBAQAEBMQAEBMQAAAMQEBAMQEBAAQExAAQExAAAAxAQEAxAQEABATEABATEAAADEBAQDEBAQAEBMQAEBMQAAAMQEBAMQEBAAQExAAQExAAAAxAQEAxAQEABATEABATEAAADEBAQDEBAQAEBMQAEBMQAAAsUs7nFlXVf24Wp3zlOfH2cnPvSc09fTh094Tmjr+7VHvCc08ONnlKzsf04M/ek9o6pfTqfeEpr4/+an3hKaOj497T2his9n8/ec6Obeapn//hx6G4U5V3d55FQAwFzfHcby77YefGRD/ZBiGvap6UlXXq+os2zYb96vqjd4jGnK/+Vry3arcb+7cb57WVXW1qu6N43i67aE4IKqqhmGYxnFc7DMM95u3Jd9vyXercr+5c7+LxUuUAEBMQAAAMQEBAMR2DYhPz3XF88f95m3J91vy3arcb+7c7wLZ6SVKAOBi8wgDAIgJCAAgJiAAgJiAAABiAgIAiP0JwuSVW1Zv18wAAAAASUVORK5CYII=\n", "text/plain": [ "<matplotlib.figure.Figure at 
0x7f80901d0080>" ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "text/plain": [ "[(0.8941176470588235, 0.10196078431372557, 0.10980392156862737),\n", " (0.21568627450980393, 0.4941176470588236, 0.7215686274509804),\n", " (0.3019607843137256, 0.6862745098039216, 0.29019607843137263),\n", " (0.5960784313725492, 0.3058823529411765, 0.6392156862745098),\n", " (1.0, 0.4980392156862745, 0.0),\n", " (0.9999999999999998, 1.0, 0.19999999999999996),\n", " (0.6509803921568629, 0.33725490196078434, 0.1568627450980391),\n", " (0.9686274509803922, 0.5058823529411766, 0.7490196078431374),\n", " (0.6, 0.6, 0.6)]" ] }, "execution_count": 10, "metadata": {}, "output_type": "execute_result" } ], "source": [ "sns.choose_colorbrewer_palette('qualitative')" ] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.4" } }, "nbformat": 4, "nbformat_minor": 2 }