Show topic distributions

This example loads a trained GC-LDA model and, for a few topics, plots the spatial distribution and prints the highest-probability terms.

Start with the necessary imports

from os.path import join

import numpy as np
import pandas as pd
from nilearn import plotting
from nilearn.masking import unmask

from gclda.model import Model
from gclda.utils import get_resource_path

Load model

model_file = join(get_resource_path(), 'models/Neurosynth2015Filtered2',
                  'model_200topics_2015Filtered2_10000iters.pklz')
model = Model.load(model_file)
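
Model.load reads the pickled, gzipped model from disk. As a quick check that the load succeeded, you can inspect the attributes this example relies on (a minimal sketch; only attributes used elsewhere on this page are assumed to exist):

print(len(model.dataset.word_labels))            # vocabulary size
print(model.n_word_tokens_word_by_topic.shape)   # word-by-topic count matrix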

Get spatial probabilities, p(voxel|topic)

p_voxel_g_topic, _ = model.get_spatial_probs()
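
The first value returned by get_spatial_probs is a voxel-by-topic matrix whose columns give p(voxel|topic). A small sanity-check sketch, assuming each column is a normalized distribution over voxels:

n_voxels, n_topics = p_voxel_g_topic.shape
print('{0} voxels, {1} topics'.format(n_voxels, n_topics))
print(np.sum(p_voxel_g_topic[:, 0]))  # should be ~1.0 if the column is normalized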

Show topic 10

topic_no = 10  # zero-based topic index
img = unmask(p_voxel_g_topic[:, topic_no], model.dataset.mask_img)

# Get the top terms and their probabilities for the current topic
wprobs = model.n_word_tokens_word_by_topic[:, topic_no] + model.beta
wprobs = wprobs / np.sum(wprobs)
word_probs = list(zip(model.dataset.word_labels, wprobs))
df = pd.DataFrame(columns=['term', 'probability'], data=word_probs)
df = df.sort_values(by='probability', ascending=False).reset_index(drop=True)
print(df.head(12))

display = plotting.plot_stat_map(img, display_mode='z')
[Figure: axial stat map for this topic (auto_examples/02_general/images/sphx_glr_plot_show_topic_figures_001.png)]
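
plot_stat_map returns a nilearn display object rather than a matplotlib figure, so saving uses the display's savefig method. A sketch (the output filename is just an example):

display.savefig('topic_010.png')  # hypothetical output path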

Out:

term  probability
0   cognitive_control     0.119603
1             demands     0.071321
2           executive     0.062462
3           difficult     0.033669
4                easy     0.024810
5   executive_control     0.023924
6           requiring     0.019938
7           selection     0.018609
8              number     0.016837
9                hard     0.015951
10             manner     0.015508
11           matching     0.015065
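
The term probabilities above are the topic's word-token counts with the symmetric smoothing hyperparameter beta added before normalization, i.e. p(word|topic) is proportional to n(word, topic) + beta. A toy illustration of the same computation, with made-up counts and beta:

toy_counts = np.array([8.0, 3.0, 0.0, 1.0])  # hypothetical word-token counts for one topic
toy_beta = 0.01                              # hypothetical smoothing hyperparameter
toy_probs = (toy_counts + toy_beta) / np.sum(toy_counts + toy_beta)
print(toy_probs)  # words with zero counts keep a small nonzero probability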

Show topic 59

topic_no = 58  # zero-based index for topic 59
img = unmask(p_voxel_g_topic[:, topic_no], model.dataset.mask_img)

# Get the top terms and their probabilities for the current topic
wprobs = model.n_word_tokens_word_by_topic[:, topic_no] + model.beta
wprobs = wprobs / np.sum(wprobs)
word_probs = list(zip(model.dataset.word_labels, wprobs))
df = pd.DataFrame(columns=['term', 'probability'], data=word_probs)
df = df.sort_values(by='probability', ascending=False).reset_index(drop=True)
print(df.head(12))

display = plotting.plot_stat_map(img, display_mode='z')
[Figure: axial stat map for this topic (auto_examples/02_general/images/sphx_glr_plot_show_topic_figures_002.png)]

Out:

term  probability
0    somatosensory     0.135916
1          tactile     0.108811
2            touch     0.088289
3      stimulation     0.048406
4          sensory     0.039113
5   discrimination     0.027496
6             body     0.022850
7     vibrotactile     0.014331
8          touched     0.013556
9           finger     0.013169
10            skin     0.012395
11       roughness     0.012008

Show topic 150

topic_no = 149  # zero-based index for topic 150
img = unmask(p_voxel_g_topic[:, topic_no], model.dataset.mask_img)

# Get the top terms and their probabilities for the current topic
wprobs = model.n_word_tokens_word_by_topic[:, topic_no] + model.beta
wprobs = wprobs / np.sum(wprobs)
word_probs = list(zip(model.dataset.word_labels, wprobs))
df = pd.DataFrame(columns=['term', 'probability'], data=word_probs)
df = df.sort_values(by='probability', ascending=False).reset_index(drop=True)
print(df.head(12))

display = plotting.plot_stat_map(img, display_mode='z')
[Figure: axial stat map for this topic (auto_examples/02_general/images/sphx_glr_plot_show_topic_figures_003.png)]

Out:

term  probability
0    emotional     0.120525
1      emotion     0.064047
2        faces     0.055130
3    affective     0.027836
4         fear     0.025134
5      fearful     0.024594
6     pictures     0.015136
7   regulation     0.014055
8       affect     0.013784
9        angry     0.012704
10      threat     0.012704
11     ratings     0.012704
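
The three topics above repeat the same steps, so it can be cleaner to wrap them in a small helper. A sketch under the same assumptions as the code above (show_topic is our name, not part of gclda):

def show_topic(model, p_voxel_g_topic, topic_no, n_terms=12):
    """Plot one topic's spatial map and print its top terms."""
    img = unmask(p_voxel_g_topic[:, topic_no], model.dataset.mask_img)
    wprobs = model.n_word_tokens_word_by_topic[:, topic_no] + model.beta
    wprobs = wprobs / np.sum(wprobs)
    df = pd.DataFrame(columns=['term', 'probability'],
                      data=list(zip(model.dataset.word_labels, wprobs)))
    df = df.sort_values(by='probability', ascending=False).reset_index(drop=True)
    print(df.head(n_terms))
    return plotting.plot_stat_map(img, display_mode='z')

for topic_no in [10, 58, 149]:
    show_topic(model, p_voxel_g_topic, topic_no)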

Total running time of the script: (0 minutes 41.400 seconds)
