- (1) provides detailed explanations for some of the latest work in the field,
- (2) incorporates some inspirations, although they may not be rigorously proven here.
📌 Research Themes: Recover speech/semantic information from invasive/non-invasive brain recordings.
Speech/semantic reconstruction of continuous language from brain recordings is an emerging research field that aims to decode speech, words, sentences, or even entire narratives from recorded neural activity patterns. It can potentially transform our understanding of how the brain processes speech.
Invasive devices have made significant breakthroughs in decoding brain signals, with deep learning algorithms trained on intracranial recordings now able to decode basic language features such as phonemes, words, and spectrograms. However, compared to invasive recording devices, non-invasive brain recordings have clear advantages for users. Currently, extending the modeling methods developed for invasive recordings to natural language and non-invasive brain recordings remains a major challenge.
Tang et al. proposed a novel approach to reconstruct continuous language from fMRI recordings of three participants who listened to spoken stories. They used GPT together with an encoding model to score the likelihood of candidate sequences, and applied beam search to decode the fMRI signals. They successfully reconstructed the auditory and semantic content of the stories. Despite the low temporal resolution of fMRI, this strategy clearly demonstrates the ability to capture language-related neural mechanisms.
Unlike traditional regression-based encoding models, Défossez et al. adopted an end-to-end framework to model the mapping between M/EEG data and speech representations. They introduce a model trained with contrastive learning to decode self-supervised representations of perceived speech from non-invasive M/EEG recordings. They evaluate their method on four public datasets covering 175 volunteers. The results show that the model can identify the corresponding speech segment from 3 seconds of MEG signals with up to 41% accuracy out of more than 1,000 distinct possibilities on average across participants, and more than 80% for the very best participants. This is an extremely exciting result. Imagine: if a language model (for example, GPT-4 or LLaMA 2) could contextualize these representations, it might well be able to recover the original auditory stimuli.
A recent preprint combined these two lines of work. First, a multi-subject decoding model was trained with contrastive learning to reconstruct continuous word embeddings from MEG data. A beam search algorithm was then used to generate text sequences from the reconstructed word embeddings: given a candidate sentence in the beam, a language model predicted the subsequent words.
Decoding brain signals is a significant challenge. From the perspective of computer science and artificial intelligence, I think these efforts provide excellent entry points into this field.
On this page, I will introduce some representative works in detail and retrace the decoding process for an M/EEG recording. Because large artifacts can be a problem in M/EEG data, many details matter, and I try to show them all with as much code as possible. Some further explorations, such as decoding sentences from the speech representations predicted from EEG data, are then presented. In summary, this page:
Formal research results are still in progress
Part One: Decoding speech perception from non-invasive brain recordings¶
In the previous section, we mentioned an end-to-end decoding framework, and that is where we will start. The many details of its data processing give a good feel for the characteristics of M/EEG data. The paper observes that current methods are limited to:
- training a model on a single patient
- aiming to decode a limited set of interpretable features (MEL spectrogram, letters, phonemes, small set of words).
The authors propose two approaches to address these issues:
- a single architecture trained across a large cohort of participants and
- deep representations of speech learnt with self-supervised learning on a large quantity of speech data.
Now, we will explore this work through inference.
1. Dataset¶
We start directly with the most appealing result. In Table 2 of the paper, we observe that the model (+wav2vec2.0) achieves a Top-10 accuracy of 70.7% on Gwilliams (MEG). This result is obtained on the MEG-MASC dataset; note the disk space requirement, as it is 100 GB in size.
"MEG-MASC" dataset provides a curated set of raw magnetoencephalography (MEG) recordings of 27 English speakers who listened to two hours of naturalistic stories. Each participant performed two identical sessions, involving listening to four fictional stories from the Manually Annotated Sub-Corpus (MASC) intermixed with random word lists and comprehension questions.
The authors time-stamp the onset and offset of each word and phoneme in the metadata of the recording, and organize the dataset according to the 'Brain Imaging Data Structure' (BIDS).
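As a quick orientation, loading a single recording through this BIDS layout could look like the following sketch; the repository wraps this logic inside bm.studies.gwilliams2022, and the root path below is only illustrative.
from mne_bids import BIDSPath, read_raw_bids

# Hedged sketch: read one MEG-MASC recording via mne-bids.
# The root path and entity values are illustrative; they mirror the paths
# that appear in the cell outputs further below.
bids_path = BIDSPath(subject="01", session="0", task="0", datatype="meg",
                     root="data/gwilliams2022/download")
raw = read_raw_bids(bids_path)
print(raw.info["sfreq"])  # 1000.0 Hz before any resampling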
import logging
import os
os.environ["CUDA_VISIBLE_DEVICES"] = "1"
from collections import defaultdict
from pathlib import Path
import flashy.logging
import flashy.utils
import mne
import numpy as np
import pandas as pd
import torch
import bm
from bm import play
from bm.losses import ClipLoss
from bm.train import main
from omegaconf import OmegaConf
from torch.utils.data import ConcatDataset, DataLoader, TensorDataset
from scripts.run_eval_probs import _get_extra_info, _load_test_data, EvalJob, Evaluator, run_eval
logger = logging.getLogger(__name__)
selection = {'study': 'gwilliams2022'}
recording_lists = list(bm.studies.from_selection(selection))
sample_recording = recording_lists[0]
print("# of recording:",len(recording_lists))
recording_lists[:10]
# of recording: 196
[Gwilliams2022Recording('01_session0_story0'), Gwilliams2022Recording('01_session0_story1'), Gwilliams2022Recording('01_session0_story2'), Gwilliams2022Recording('01_session0_story3'), Gwilliams2022Recording('01_session1_story0'), Gwilliams2022Recording('01_session1_story1'), Gwilliams2022Recording('01_session1_story2'), Gwilliams2022Recording('01_session1_story3'), Gwilliams2022Recording('02_session0_story0'), Gwilliams2022Recording('02_session0_story1')]
bm.studies.from_selection has customized loading methods for the four datasets. We will focus on the first recording. The first 10 recording objects are printed above, each identified by subject, session, and story.
sample_recording.mne_info
bids_path: /ssd3/other/penglinkai01/brainmagick/data/gwilliams2022/download/sub-01/ses-0/meg/sub-01_ses-0_task-0_meg.con Extracting SQD Parameters from /ssd3/other/penglinkai01/brainmagick/data/gwilliams2022/download/sub-01/ses-0/meg/sub-01_ses-0_task-0_meg.con... Creating Raw.info structure... Setting channel info structure... Creating Info structure... Ready. Reading events from /ssd3/other/penglinkai01/brainmagick/data/gwilliams2022/download/sub-01/ses-0/meg/sub-01_ses-0_task-0_events.tsv. Reading channel info from /ssd3/other/penglinkai01/brainmagick/data/gwilliams2022/download/sub-01/ses-0/meg/sub-01_ses-0_task-0_channels.tsv. The stimulus channel "STI 014" is present in the raw data, but not included in channels.tsv. Removing the channel. NOTE: pick_types() is a legacy function. New code should use inst.pick(...). NOTE: pick_types() is a legacy function. New code should use inst.pick(...).
/ssd3/other/penglinkai01/brainmagick/bm/studies/gwilliams2022.py:106: RuntimeWarning: The unit for channel(s) MISC 001, MISC 002, MISC 003, MISC 004, MISC 005, MISC 006, MISC 007, MISC 008, MISC 009, MISC 010, MISC 011, MISC 012, MISC 013, MISC 014, MISC 015, MISC 016, MISC 017, MISC 018, MISC 019, MISC 020, MISC 021, MISC 022, MISC 023, MISC 024, MISC 025, MISC 026, MISC 027, MISC 028, MISC 029, MISC 030, MISC 031, MISC 032 has changed from V to NA. raw = read_raw_bids(bids_path) # FIXME this is NOT a lazy read
Measurement date | January 01, 2000 00:00:00 GMT
---|---
Experimenter | mne_anonymize
Participant | sub-01
Digitized points | Not available
Good channels | 208 Magnetometers
Bad channels | None
EOG channels | Not available
ECG channels | Not available
Sampling frequency | 1000.00 Hz
Highpass | 0.03 Hz
Lowpass | 200.00 Hz
sample_recording.raw().get_data().shape
(208, 396000)
The information of sample 01_session0_story0
is printed (see mne_info
in mne-python). It has 208 channels and a sampling rate of 1000Hz. The recorded signal shape indicates a duration of 396 seconds (396000/1000).
sample_recording.events()[:5] # load when first access. see bm.studies.api.Recording method events()
story | story_uid | sound_id | kind | start | sound | duration | filepath | phoneme | sequence_id | ... | speech_rate | voice | pronounced | word | language | modality | word_sequence | phoneme_id | offset | uid | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | NaN | NaN | NaN | block | 23.506 | NaN | 6.250000 | NaN | NaN | NaN | ... | NaN | NaN | NaN | NaN | english | audio | NaN | NaN | NaN | Tara stood stock still waiting for the first t... |
1 | lw1 | 0.0 | 0.0 | word | 23.506 | stimuli/audio/lw1_0.wav | 0.300000 | NaN | NaN | 0.0 | ... | 205.0 | Allison | 1.0 | Tara | english | audio | Tara stood stock still waiting for the first t... | NaN | NaN | NaN |
2 | lw1 | 0.0 | 0.0 | sound | 23.506 | stimuli/audio/lw1_0.0.wav | 95.881678 | /ssd3/other/penglinkai01/brainmagick/data/gwil... | NaN | NaN | ... | NaN | NaN | NaN | NaN | english | audio | NaN | NaN | 0.0 | NaN |
3 | lw1 | 0.0 | 0.0 | phoneme | 23.506 | stimuli/audio/lw1_0.wav | 0.080000 | NaN | t_B | 0.0 | ... | 205.0 | Allison | 1.0 | NaN | english | audio | NaN | 0.0 | NaN | NaN |
4 | lw1 | 0.0 | 0.0 | phoneme | 23.586 | stimuli/audio/lw1_0.wav | 0.090000 | NaN | eh_I | 0.0 | ... | 205.0 | Allison | 1.0 | NaN | english | audio | NaN | 1.0 | NaN | NaN |
5 rows × 22 columns
uid = (sample_recording.__class__.__name__, sample_recording.subject_uid)
uid
('Gwilliams2022Recording', '01')
The recording's events() include the start times, durations, and other information for sounds, words, and phonemes. Among them, kind indicates the type of event (block, sound, word, or phoneme). The uid constructed above identifies the subject, which will be a crucial attribute later.
sample_recording.events()[sample_recording.events().kind == 'word']
story | story_uid | sound_id | kind | start | sound | duration | filepath | phoneme | sequence_id | ... | speech_rate | voice | pronounced | word | language | modality | word_sequence | phoneme_id | offset | uid | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
1 | lw1 | 0.0 | 0.0 | word | 23.506 | stimuli/audio/lw1_0.wav | 0.30 | NaN | NaN | 0.0 | ... | 205.0 | Allison | 1.0 | Tara | english | audio | Tara stood stock still waiting for the first t... | NaN | NaN | NaN |
7 | lw1 | 0.0 | 0.0 | word | 23.816 | stimuli/audio/lw1_0.wav | 0.24 | NaN | NaN | 0.0 | ... | 205.0 | Allison | 1.0 | stood | english | audio | Tara stood stock still waiting for the first t... | NaN | NaN | NaN |
13 | lw1 | 0.0 | 0.0 | word | 24.056 | stimuli/audio/lw1_0.wav | 0.37 | NaN | NaN | 0.0 | ... | 205.0 | Allison | 1.0 | stock | english | audio | Tara stood stock still waiting for the first t... | NaN | NaN | NaN |
17 | lw1 | 0.0 | 0.0 | word | 24.586 | stimuli/audio/lw1_0.wav | 0.40 | NaN | NaN | 0.0 | ... | 205.0 | Allison | 1.0 | still | english | audio | Tara stood stock still waiting for the first t... | NaN | NaN | NaN |
23 | lw1 | 0.0 | 0.0 | word | 25.136 | stimuli/audio/lw1_0.wav | 0.41 | NaN | NaN | 0.0 | ... | 205.0 | Allison | 1.0 | waiting | english | audio | Tara stood stock still waiting for the first t... | NaN | NaN | NaN |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
3147 | lw1 | 0.0 | 3.0 | word | 361.097 | stimuli/audio/lw1_3.wav | 0.17 | NaN | NaN | 52.0 | ... | 205.0 | Allison | 1.0 | end | english | audio | Tara would not let giddy hopes drag them onto ... | NaN | NaN | NaN |
3150 | lw1 | 0.0 | 3.0 | word | 361.277 | stimuli/audio/lw1_3.wav | 0.14 | NaN | NaN | 52.0 | ... | 205.0 | Allison | 1.0 | for | english | audio | Tara would not let giddy hopes drag them onto ... | NaN | NaN | NaN |
3154 | lw1 | 0.0 | 3.0 | word | 361.487 | stimuli/audio/lw1_3.wav | 0.58 | NaN | NaN | 52.0 | ... | 205.0 | Allison | 1.0 | project | english | audio | Tara would not let giddy hopes drag them onto ... | NaN | NaN | NaN |
3162 | lw1 | 0.0 | 3.0 | word | 362.207 | stimuli/audio/lw1_3.wav | 0.15 | NaN | NaN | 52.0 | ... | 205.0 | Allison | 1.0 | and | english | audio | Tara would not let giddy hopes drag them onto ... | NaN | NaN | NaN |
3165 | lw1 | 0.0 | 3.0 | word | 362.817 | stimuli/audio/lw1_3.wav | 0.34 | NaN | NaN | 52.0 | ... | 205.0 | Allison | 1.0 | species | english | audio | Tara would not let giddy hopes drag them onto ... | NaN | NaN | NaN |
668 rows × 22 columns
The above code filters out all the word events; for sample_recording, there are 668 of them (the 3165 shown for the last row is its index in the full events table). The last word starts at 362.817 seconds and lasts 0.34 seconds.
During the preprocessing stage, the MEG recording is resampled to 120 Hz using julius.ResampleFrac(). The preprocessing results are cached to disk for efficiency, with _cache_folder specifying the storage location. After resampling, the shape is (208, 47520).
low_mne = bm.studies.api.preprocess_mne(sample_recording.raw(),sample_rate=120,highpass=0)
sample_recording._cache_folder = Path("cache/studies/gwilliams2022/01_session0_story0")
bm.dataset._preload(sample_recording, sample_rate=120, highpass=0)
low_mne
Creating RawArray with float64 data, n_channels=208, n_times=47520 Range : 0 ... 47519 = 0.000 ... 395.992 secs Ready. Opening raw data file cache/studies/gwilliams2022/01_session0_story0/meg-sr120-hp0-raw.fif... Isotrak not found Range : 0 ... 47519 = 0.000 ... 395.992 secs Ready.
Measurement date | January 01, 2000 00:00:00 GMT
---|---
Experimenter | mne_anonymize
Participant | sub-01
Digitized points | Not available
Good channels | 208 Magnetometers
Bad channels | None
EOG channels | Not available
ECG channels | Not available
Sampling frequency | 120.00 Hz
Highpass | 0.03 Hz
Lowpass | 200.00 Hz
Duration | 00:06:36 (HH:MM:SS)
low_mne.get_data().shape
(208, 47520)
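The resampling inside preprocess_mne boils down to a fractional resample of the (channels, time) array; here is a hedged sketch with julius, not the exact pipeline code:
import julius
import torch

# Hedged sketch of the 1000 Hz -> 120 Hz resampling step.
raw_1000hz = torch.from_numpy(sample_recording.raw().get_data()).float()  # (208, 396000)
resampler = julius.ResampleFrac(1000, 120)
meg_120hz = resampler(raw_1000hz)
print(meg_120hz.shape)  # expected to be (208, 47520), matching the cached result above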
Now we use this recording to construct the input for the model. Obviously, from a recording of nearly 400 seconds, multiple 3-second samples can be extracted. The event type block is used to segment the recording, and the merge_blocks function concatenates blocks shorter than min_block_duration. The blocks are then randomly assigned to train, test, and validation subsets in a 7:2:1 ratio. The preprocessed function implements the resampling step described above. For the test set, an additional step is applied: a 3-second segment (from -500 milliseconds to 2.5 seconds) is selected for each word in the test set; note that tmin is -500 ms and tmax is 2.5 s.
test_ratio, valid_ratio = 0.2, 0.1
min_block_duration = 6
min_n_blocks_per_split = 1
sample_rate = 120
highpass=0
tmin, tmax = -0.5, 2.5
meg_dimension = max(recording.meg_dimension for recording in [sample_recording])
factory_kwargs = {}
factory_kwargs.update(sample_rate=sample_rate, highpass=highpass, meg_dimension=meg_dimension,baseline=None)
fact = bm.dataset.SegmentDataset.Factory(**factory_kwargs)
# we only use one example for probe
for i, recording in enumerate([sample_recording]):
    events = recording.events()
    blocks = events[events.kind == 'block']
    blocks = blocks.event.merge_blocks(min_block_duration_s=min_block_duration)
    blocks = bm.dataset.assign_blocks(blocks, [test_ratio, valid_ratio], seed=12, min_n_blocks_per_split=min_n_blocks_per_split)
    # start-stops
    # [(0.0, 29.756), (29.756, 40.096), (40.096, 68.416), ...]
    start_stops = [(b.start, b.start + b.duration) for b in blocks.itertuples()]
    # following code are same as "fact.apply(recording, blocks=start_stops)"
    data = recording.preprocessed(sample_rate, highpass=highpass)
    sample_rate = bm.utils.Frequency(data.info["sfreq"])
    times = np.arange(0, data.times[-1], 3.0)
    events = recording.events().copy()
    events = events.sort_values('start')
    delta = 0.5 / sample_rate
    mask = np.logical_and(times + tmin >= 0, times + tmax < data.times[-1] + delta)
    print("Mask(raw):",mask.sum())
    in_any_split = False
    counter = 0
    for start, stop in start_stops:
        in_split = times + tmin >= start
        margin = tmax - delta
        in_split &= times + margin < stop
        in_any_split |= in_split
    mask &= in_any_split
    samples = sample_rate.to_ind(times[mask])
    unique_samples = np.unique(samples)
    print("Mask(processed):",mask.sum())
    print("# of unique_samples:",len(unique_samples))
Mask(raw): 131 Mask(processed): 104 # of unique_samples: 104
The selected recording has a duration of 396 seconds. With a 3-second stride, we obtain 131 possible starting positions (see times below). However, each starting point must fall inside a block interval so that the segment contains complete words; that is, the start time and the end time must both lie within the same block. In the end, 104 samples remain. The following output demonstrates this process:
For the first sample, it belongs to the start_stops interval (0.0, 29.756):
times=
[ 0. 3. 6. 9. 12. 15. 18. 21. 24. 27. 30. 33. 36. 39.
42. 45. 48. 51. 54. 57. 60. 63. 66. 69. 72. 75. 78. 81.
84. 87. 90. 93. 96. 99. 102. 105. 108. 111. 114. 117. 120. 123.
126. 129. 132. 135. 138. 141. 144. 147. 150. 153. 156. 159. 162. 165.
168. 171. 174. 177. 180. 183. 186. 189. 192. 195. 198. 201. 204. 207.
210. 213. 216. 219. 222. 225. 228. 231. 234. 237. 240. 243. 246. 249.
252. 255. 258. 261. 264. 267. 270. 273. 276. 279. 282. 285. 288. 291.
294. 297. 300. 303. 306. 309. 312. 315. 318. 321. 324. 327. 330. 333.
336. 339. 342. 345. 348. 351. 354. 357. 360. 363. 366. 369. 372. 375.
378. 381. 384. 387. 390. 393.]
times + tmin >= start
[False True True True True True True True True True True True
True True True True True True True True True True True True
True True True True True True True True True True True True
True True True True True True True True True True True True
True True True True True True True True True True True True
True True True True True True True True True True True True
True True True True True True True True True True True True
True True True True True True True True True True True True
True True True True True True True True True True True True
True True True True True True True True True True True True
True True True True True True True True True True True True]
in_split &= times + margin < stop
[False True True True True True True True True True False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False]
mask
[False True True True True True True True True True False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False
False False False False False False False False False False False False]
Finally, for the interval (0.0, 29.756), the starting positions 3, 6, 9, 12, 15, 18, 21, 24, and 27 yield valid test segments. From the uid column of the blocks, we can get an idea of the approximate content of this block. The corresponding audio clip is also shown below.
blocks[:3]
start | duration | modality | language | uid | kind | split | |
---|---|---|---|---|---|---|---|
0 | 0.000 | 29.756 | audio | english | Tara stood stock still waiting for the first t... | block | 1 |
1 | 29.756 | 10.340 | audio | english | The gentle constant breeze of recycled air fro... | block | 2 |
2 | 40.096 | 28.320 | audio | english | Results Harmon she suppressed the surge of ann... | block | 0 |
from IPython.display import Audio, display
display(Audio(filename="lw1_0_clip.wav", rate=16000))
2. Method¶
The above image shows the model used, with the problem formalization and its contributions indicated on the right side.
To get a detailed understanding of these methods and the intent behind them, I ran inference on a sample from the dataset; specifically, $(X, Y)$ denotes an M/EEG segment paired with (the representation of) its corresponding speech audio. Extracting useful information from M/EEG signals can be challenging due to noise. The following code carefully traces the tensors and the operations applied to them, which helps explain why the method works.
Wav2vec 2.0¶
Wav2vec 2.0 is a self-supervised speech model that learns deep representations from unlabeled speech waveforms. Its working process can be described in the following steps:
Feature Extraction: First, the model takes in an original speech waveform $S \in \mathbb{R}^{T'}$, where $T'$ is the number of time steps. The CNN feature extractor $f_{\text{feat}}$ transforms this waveform into a series of latent representations $C \in \mathbb{R}^{F\times T}$, where $F$ is the hidden dimension and $T$ the number of frames.
Context Network: Then, the context network $f_{\text{context}}$ takes these latent representations and uses a self-attention mechanism to capture the relationships between them. The output of this network is a series of context representations $Y \in \mathbb{R}^{F\times T}$.
Contrastive Loss: During training, a contrastive loss $L_{\text{contrast}}$ encourages the context representation at each (masked) time step to identify the true latent for that step among distractors sampled from other time steps. This process can be represented as:
$$
\min_{f_{\text{feat}}, f_{\text{context}}} L_{\text{contrast}}(Y, C)
$$
After training, wav2vec 2.0 generates robust representations $Y$ that can be used for various downstream tasks such as speech recognition or speech translation. Here, the authors use wav2vec2-large-xlsr-53, which was pre-trained on 56k hours of speech from 53 different languages. During training of the decoder, the parameters of the wav2vec 2.0 model are not updated.
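To make the feature-extraction step concrete, here is a hedged sketch using the HuggingFace transformers API rather than the repository's wrapper; the checkpoint name comes from the paper, and the averaged layer indices follow the configuration printed later in this section.
import torch
from transformers import Wav2Vec2FeatureExtractor, Wav2Vec2Model

extractor = Wav2Vec2FeatureExtractor.from_pretrained("facebook/wav2vec2-large-xlsr-53")
model = Wav2Vec2Model.from_pretrained("facebook/wav2vec2-large-xlsr-53").eval()

waveform = torch.randn(16000 * 3)  # stand-in for a 3-second clip at 16 kHz
inputs = extractor(waveform.numpy(), sampling_rate=16000, return_tensors="pt")
with torch.no_grad():
    outputs = model(inputs["input_values"], output_hidden_states=True)
# hidden_states holds the CNN output plus the 24 transformer layers (25 tensors);
# averaging a subset of layers yields the speech representation Y.
layers = [14, 15, 16, 17, 18]  # indices reported by the loaded checkpoint below
speech_repr = torch.stack(outputs.hidden_states)[layers].mean(0)  # (1, T, 1024)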
Brain module¶
For the brain module, the paper introduces a deep neural network ${f}_\mathrm{clip}$ that takes as input the raw M/EEG time series $X$ and a one-hot encoding of the corresponding subject $s$, and outputs a latent brain representation $Z$ with the same sampling rate as $X$.
Due to the complexity of the data processing, there is still some way to go before we reach familiar code such as a torch.nn.Module and its forward() function for the brain module. For this part, we will understand its structure through experiments. You can obtain the pre-trained model checkpoint from this GitHub issue and place it under the relative paths outputs/grids/base/97d170e1 and outputs/xps/97d170e1 (the default locations).
sig = "97d170e1"
logger.info(f"Loading solver {sig}")
mne.set_log_level(False)
flashy.logging.setup_logging(with_file_log=False)
solver = play.get_solver_from_sig(sig, override_cfg={})
solver.model.eval()
solver.loss.eval()
xp._argv_cache: /ssd3/other/penglinkai01/brainmagick/outputs/xps/97d170e1/.argv.json
[11-14 22:38:21][bm.play][INFO] - Loading solver from XP 97d170e1. Overrides used: ['dset.selections=[gwilliams2022]'] [11-14 22:38:21][bm._env][WARNING] - Hostname gpu226.corp.yodao.com not defined in /conf/study_paths/study_paths.yaml. Using default paths. [11-14 22:38:21][bm.dataset][WARNING] - Requested 1000 recordings but only found 196 [11-14 22:38:33][bm.dataset][INFO] - Loading Subjects | 39/196 | 5.48 it/sec [11-14 22:38:39][bm.dataset][INFO] - Loading Subjects | 78/196 | 5.71 it/sec [11-14 22:38:46][bm.dataset][INFO] - Loading Subjects | 117/196 | 5.68 it/sec [11-14 22:38:53][bm.dataset][INFO] - Loading Subjects | 156/196 | 5.75 it/sec [11-14 22:38:59][bm.dataset][INFO] - Loading Subjects | 195/196 | 5.74 it/sec [11-14 22:38:59][bm.dataset][INFO] - # Examples (train | valid | test): 203152 | 35156 | 69972 [11-14 22:39:01][bm.train][INFO] - Model hash: ed97b0fbdffe06faf696d2eecaacb57b143fd68d /ssd3/other/penglinkai01/miniconda3/envs/bm/lib/python3.8/site-packages/flashy/loggers/tensorboard.py:47: UserWarning: tensorboard package was not found: use pip install tensorboard warnings.warn("tensorboard package was not found: use pip install tensorboard")
ClipLoss()
In this framework, a signature uniquely identifies a training run. The solver loaded through it aggregates components such as the dataset, model, optimizer, and loss. Almost all of the experimental information is preserved (as seen in the cell above), including the dataset used (dset.selections) and the number of train, validation, and test samples. Next, we load the dataloader directly and run the model on one batch.
datasets = solver.datasets.test.datasets # [bm.dataset.SegmentDataset,bm.dataset.SegmentDataset,bm.dataset.SegmentDataset,...]
print("len(datasets):",len(datasets))
dataset = ConcatDataset(datasets)
loader = DataLoader(dataset, num_workers=0, batch_size=8, collate_fn=bm.dataset.SegmentBatch.collate_fn)
sample_rate = 120
len(datasets): 196
Using ConcatDataset, we concatenate the test datasets stored in the solver and wrap them with a PyTorch DataLoader.
batch = next(iter(loader))
# see bm.dataset.Segmentbatch
print("batch.meg.shape:",batch.meg.shape)
print("batch.subject_index:",batch.subject_index)
print("len of batch._event_lists:",len(batch._event_lists))
print("batch.features.shape:",batch.features.shape)
batch.meg.shape: torch.Size([8, 208, 361]) batch.subject_index: tensor([0, 0, 0, 0, 0, 0, 0, 0]) len of batch._event_lists: 8 batch.features.shape: torch.Size([8, 1025, 361])
meg and subject_index are the inputs to the brain module. subject_index identifies the participant each sample comes from (27 participants for Gwilliams2022, matching the SubjectLayers module shown later); here every entry is 0 because the whole batch comes from subject 01. Its length equals the batch_size. It plays a role somewhat similar to a speaker embedding in TTS, capturing overall characteristics of that participant's recordings. The shape of meg is [B, C, T], where T = 361 because each segment is 3 seconds long at a sampling rate of 120 Hz (3 s × 120 Hz, plus one boundary sample). _event_lists are also included, which helps in recovering the original information.
Then you will notice that the shape of features looks very familiar. Yes, it is the feature extracted by Wav2Vec 2.0 (even though it seems to have one extra dimension, 1025 vs 1024). I was curious where it came from. In fact, the authors cache this part of the computation: if you have run the training program locally, you will find npy files in paths like cache/Wav2VecEmbedding. These files store the features pre-computed during the first run, and SegmentDataset loads them back into memory in its __getitem__() function. To find out how wav2vec 2.0 is invoked, I deleted/moved the cache directory and traced the following code path:
SegmentDataset.__getitem__() >
self._get_feature(index) >
self.features(start, stop) >
feature_builder.__call__() >
val = feature.get_on_overlap(event, overlap) >
Wav2VecTransformer.get_on_overlap >
self._get_cached_tensor() >
self._compute_hidden_states >
Here we finally see familiar code: reading the speech file and running the model forward.
def _compute_hidden_states(
        self, name: str, filepath: Path, start: float, stop: float,
        layers: tp.Optional[tp.List[int]] = None) -> torch.Tensor:
    input_values = self._preprocess_wav(filepath=filepath, start=start, stop=stop)
    self.model.to(self.device)
    self.model.eval()  # needs to be in eval mode
    with torch.no_grad():
        outputs = self.model(input_values.to(self.device), output_hidden_states=True)
    out: tp.Any = outputs.get(name)
    if isinstance(out, tuple):
        out = torch.stack(out)
    if layers is not None:
        out = out[layers].mean(0)
    return out.detach().cpu().clone().numpy()
The layers
parameter specifies which layers of the Transformer will be averaged. In practice, Wav2VecTransformer
is considered as a feature extractor in the datasets
. This is a convenient design because the parameters of this part are not updated during training.
feature_builder = solver.datasets.test.datasets[0].features
features = feature_builder.extract_features(batch.features, solver.used_features.keys())
batch = batch.replace(features=features.to(solver.device))
print("feature_builder:\n\t",feature_builder)
print("solver.used_features.keys():\n\t",solver.used_features.keys())
print("batch.features.shape:",batch.features.shape)
print("Transformer layers used for average:",feature_builder["Wav2VecTransformer"].layers) # Paper said they used the last four but here is diff.
feature_builder: FeaturesBuilder([('Wav2VecTransformer', Wav2VecTransformer(120.0)), ('WordHash', WordHash(120.0))]) solver.used_features.keys(): odict_keys(['Wav2VecTransformer']) batch.features.shape: torch.Size([8, 1024, 361]) Transformer layers used for average: [14, 15, 16, 17, 18]
It can be seen that feature_builder stores both Wav2VecTransformer and WordHash, but only Wav2VecTransformer is used here. The shape of features is as expected (1024), and batch.features is updated via replace. However, the output layers used seem inconsistent with the paper, which states that the last four layers were averaged. The code below prints the Wav2Vec 2.0 model.
feature_builder["Wav2VecTransformer"].model
Wav2Vec2Model( (feature_extractor): Wav2Vec2FeatureEncoder( (conv_layers): ModuleList( (0): Wav2Vec2LayerNormConvLayer( (conv): Conv1d(1, 512, kernel_size=(10,), stride=(5,)) (layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True) (activation): GELUActivation() ) (1-4): 4 x Wav2Vec2LayerNormConvLayer( (conv): Conv1d(512, 512, kernel_size=(3,), stride=(2,)) (layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True) (activation): GELUActivation() ) (5-6): 2 x Wav2Vec2LayerNormConvLayer( (conv): Conv1d(512, 512, kernel_size=(2,), stride=(2,)) (layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True) (activation): GELUActivation() ) ) ) (feature_projection): Wav2Vec2FeatureProjection( (layer_norm): LayerNorm((512,), eps=1e-05, elementwise_affine=True) (projection): Linear(in_features=512, out_features=1024, bias=True) (dropout): Dropout(p=0.1, inplace=False) ) (encoder): Wav2Vec2EncoderStableLayerNorm( (pos_conv_embed): Wav2Vec2PositionalConvEmbedding( (conv): Conv1d(1024, 1024, kernel_size=(128,), stride=(1,), padding=(64,), groups=16) (padding): Wav2Vec2SamePadLayer() (activation): GELUActivation() ) (layer_norm): LayerNorm((1024,), eps=1e-05, elementwise_affine=True) (dropout): Dropout(p=0.1, inplace=False) (layers): ModuleList( (0-23): 24 x Wav2Vec2EncoderLayerStableLayerNorm( (attention): Wav2Vec2Attention( (k_proj): Linear(in_features=1024, out_features=1024, bias=True) (v_proj): Linear(in_features=1024, out_features=1024, bias=True) (q_proj): Linear(in_features=1024, out_features=1024, bias=True) (out_proj): Linear(in_features=1024, out_features=1024, bias=True) ) (dropout): Dropout(p=0.1, inplace=False) (layer_norm): LayerNorm((1024,), eps=1e-05, elementwise_affine=True) (feed_forward): Wav2Vec2FeedForward( (intermediate_dropout): Dropout(p=0.0, inplace=False) (intermediate_dense): Linear(in_features=1024, out_features=4096, bias=True) (intermediate_act_fn): GELUActivation() (output_dense): Linear(in_features=4096, out_features=1024, bias=True) (output_dropout): Dropout(p=0.1, inplace=False) ) (final_layer_norm): LayerNorm((1024,), eps=1e-05, elementwise_affine=True) ) ) ) )
M/EEG data can suffer from large artifacts. Baseline correction and sklearn.preprocessing.RobustScaler are used.
- Baseline correction: performed when initializing mne.Epochs in bm.dataset._DatasetFactory.apply(). It is applied to each epoch and channel individually: the mean signal over the baseline period is computed and subtracted from the entire epoch.
- RobustScaler: this scaler removes the median and scales the data by the interquartile range (IQR). It is commonly used when outliers would distort mean- and variance-based standardization. The scaling is fitted per recording, so the number of scalers equals the number of recordings (196).
For the Wav2Vec2.0 features, there is no need to worry too much about the data range. Using StandardScaler
is sufficient, as its name suggests.
(See Section 2.4 Preprocessing and Section A.2 Impact of clamping)
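Conceptually, the MEG-side normalization amounts to the following hedged sketch (illustrative arrays, not the repository code; the real pipeline fits one RobustScaler per recording on all of its data):
import numpy as np
from sklearn.preprocessing import RobustScaler

rng = np.random.default_rng(0)
epoch = rng.normal(size=(208, 361))   # stand-in for one (channels, time) segment at 120 Hz
n_baseline = 60                       # the 0.5 s before onset (tmin = -0.5 s)

# 1) Baseline correction: subtract each channel's mean over the baseline window.
epoch = epoch - epoch[:, :n_baseline].mean(axis=1, keepdims=True)

# 2) Robust scaling: median / inter-quartile range instead of mean / variance.
scaler = RobustScaler().fit(epoch.T)  # in the real pipeline, fitted per recording
scaled = scaler.transform(epoch.T).T

# 3) Clamping: values beyond 20 (in scaled units) are clipped to limit outliers.
scaled = np.clip(scaled, -20, 20)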
# Rescales the input MEG and features. If the MEG after rescaling
# still contains large values (e.g. more than `limit`) rejects the offending item.
batch, reject_mask = solver.scale_reject(batch) # see bm.norm.ScaleReject
print("# of meg_scalers:", len(solver.scale_reject.scaler.meg_scalers))
print(" Type of meg_scalers:", solver.scale_reject.scaler.meg_scalers[0])
print(" Clamp of meg_scalers:",solver.scale_reject.limit)
print("# of feature_scalers:", len(solver.scale_reject.scaler.feature_scalers))
print(" Type of feature_scalers:", solver.scale_reject.scaler.feature_scalers['Wav2VecTransformer'])
# of meg_scalers: 196 Type of meg_scalers: <bm.norm.RobustScaler object at 0x7f25a7e9de20> Clamp of meg_scalers: 20.0 # of feature_scalers: 1 Type of feature_scalers: <bm.norm.StandardScaler object at 0x7f25a50e58b0>
The information about RobustScaler and StandardScaler is shown above. Note that the Clamp of meg_scalers value is 20, applied with the torch.Tensor.clamp_() method: values more than 20 (scaled) standard deviations away are clamped. This operation minimizes the impact of large outlier samples. The authors also studied this value carefully (see Section A.2, Impact of clamping); from the experimental results, clamping appears necessary for handling M/EEG data.
Clamping | Brennan (EEG) | Broderick (EEG) | Gwilliams (MEG) | Schoffelen (MEG) |
---|---|---|---|---|
20 | 25.7 ± 2.9 | 17.7 ± 0.6 | 70.7 ± 0.1 | 67.5 ± 0.4 |
100 | 27.1 ± 2.6 | 7.6 ± 0.0 | 70.6 ± 0.3 | 67.2 ± 0.9 |
None | 14.1 ± 1.0 | 0.5 ± 0.0 | 23.6 ± 24.6 | 1.5 ± 0.3 |
meg = batch.meg
features = batch.features
features_mask = torch.ones_like(batch.features_mask)
offset_meg_samples = int(150 / 1000 * sample_rate) # 150ms Residual See Sec 2.2.2 Brain module - Residual dilated convolutions.
meg = meg[..., offset_meg_samples:]
offset_features_samples = offset_meg_samples
features = features[..., :-offset_features_samples]
features_mask = features_mask[..., :-offset_features_samples]
inputs = dict(meg=meg.to(features))
output = features
# estimate = solver.model(inputs, batch)
length = next(iter(inputs.values())).shape[-1] # length of any of the inputs
Given the expected delay between a stimulus and its corresponding brain response, the code further shifts the input brain signal by 150 ms into the future to facilitate the alignment between $Y$ and $Z$.
I'm glad we've reached this point, and now let's take a look at several parts of the Brain module (Part E in the picture). Please don't forget about meg
and subject_index
, as they are the inputs to the module.
Spatial attention¶
# following code is the same as `inputs["meg"] = solver.model.merger(inputs["meg"], batch)`
meg = inputs["meg"]
B, C, T = meg.shape
positions = solver.model.merger.position_getter.get_positions(batch)
embedding = solver.model.merger.embedding(positions)
heads = solver.model.merger.heads[None].expand(B, -1, -1)
scores = torch.einsum("bcd,bod->boc", embedding.to(heads), heads)
weights = torch.softmax(scores, dim=2)
out = torch.einsum("bct,boc->bot", meg, weights)
inputs["meg"] = out
print("meg.shape",meg.shape)
print("positions",positions.shape)
print("solver.model.merger.embedding:", solver.model.merger.embedding)
print("out.shape", out.shape)
meg.shape torch.Size([8, 208, 343]) positions torch.Size([8, 208, 2]) solver.model.merger.embedding: FourierEmb() out.shape torch.Size([8, 270, 343])
First, let's start with the position_getter. The PositionGetter class relies on a projection function, layout = mne.find_layout(info), which uses a device-dependent surface designed to preserve channel distances. The 3D sensor locations are projected onto a 2D plane, and the resulting 2D positions are normalized to $[0, 1]$.
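A hedged sketch of that projection (the normalization used in bm differs in its details):
import mne
import numpy as np

layout = mne.find_layout(sample_recording.mne_info)  # device-dependent 2D layout
pos = layout.pos[:, :2]                              # keep only the x/y coordinates
pos = (pos - pos.min(axis=0)) / (pos.max(axis=0) - pos.min(axis=0))  # rescale to [0, 1]
print(pos.shape)  # roughly one 2D position per MEG channel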
After the projection, the brain data is remapped onto D1 = 270 output channels. Viewed on the anatomical plane, the sensor positions appear roughly "uniformly" distributed, yet clearly not every position matters equally for speech perception. It is therefore promising to use attention to automatically learn the correspondence between the recorded channels and the spatially remapped output channels.
With the help of spatial location information, attention is used to weight the input channels to obtain each output channel. Specifically, for each channel $i$, it has a position $(x_i, y_i)$. Let's assume that the current processed raw M/EEG time series is $X$, which has $C$ channels. For each output channel $j\in\{1, \ldots, D_1\}$, the spatial attention (SA) is defined as:
$$ \begin{equation} \mathrm{SA}(X)^{(j)} = \frac{1}{\sum_{i=1}^{C} \mathrm{e}^{a_j(x_i, y_i)}}\left( \sum_{i=1}^{C} \mathrm{e}^{a_j(x_i, y_i)} X^{(i)} \right) \end{equation} $$
That is, each output channel is a softmax-weighted combination of the input channels, with the attention logits $a_j(x, y)$ evaluated at each input position $(x_i, y_i)$ given by:
$$ \begin{equation} a_j(x, y) = \sum_{k=1}^K\sum_{l=1}^K \mathrm{Re}(z_j^{(k, l)}) \cos\left(2 \pi (k x + l y)\right) +\mathrm{Im}(z_j^{(k, l)}) \sin\left(2 \pi (k x + l y)\right). \end{equation} $$
where $z_j \in \mathbb{C}^{K \times K}$ defines the Fourier space which has $K{=}32$ harmonics. Re()
and Im()
respectively represent the real part and imaginary part of a complex number. The following section demonstrates how to implement SA using code:
FourierEmb()
is the implementation of SA. It takes positions
as input and outputs embedding
.
# following code is the same as `embedding = solver.model.merger.embedding(positions)`
import math
*O, D = positions.shape # O = [8, 208], D = 2 (needed below for the final reshape)
n_freqs = (2048 // 2)**0.5 # 32
freqs_y = torch.arange(n_freqs).to(positions) # torch.Size([32])
freqs_x = freqs_y[:, None] # torch.Size([32, 1])
width = 1 + 2 * 0.2
positions = positions + 0.2
p_x = 2 * math.pi * freqs_x / width # torch.Size([32, 1])
p_y = 2 * math.pi * freqs_y / width # torch.Size([32])
positions = positions[..., None, None, :]
loc = (positions[..., 0] * p_x + positions[..., 1] * p_y).view(*O, -1) # torch.Size([8, 208, 32, 32]) -> torch.Size([8, 208, 1024])
embedding = torch.cat([torch.cos(loc), torch.sin(loc)], dim=-1) # torch.Size([8, 208, 2048])
heads has shape [B, O, D], where $O = 270$ is the number of output channels and $D = 2048$ the Fourier embedding dimension. The embedding (of shape [B, C, D]) is multiplied with the spatial mapping heads to obtain scores of shape [B, O, C], which are passed through torch.softmax over the input-channel dimension to obtain the weights. The output out is the weighted sum of the meg feature map.
This image displays the distribution of attention weights in two-dimensional sensor space. Red indicates M/EEG sensors that receive, on average, a higher spatial attention weight. In the Gwilliams panel (best performance), the sensors on the left and right sides clearly carry more of the informative content.
inputs["meg"] = solver.model.initial_linear(inputs["meg"])
solver.model.initial_linear
Sequential( (0): Conv1d(270, 270, kernel_size=(1,), stride=(1,)) )
Subject Layer¶
This layer has a parameter tensor of size [270, 270, 27]: the first 270 is the number of input channels, the second 270 the number of output channels, and the third value (27 for the Gwilliams2022 dataset, as stated in Table 1) the number of subject_ids.
This structure serves as the foundation for achieving the following purpose:
"A single architecture trained across a large cohort of participants."
During the forward computation, subjects gives the participant index for each MEG sample, and the [270, 270] matrix corresponding to that index transforms the input features. This operation can be seen as incorporating participant-specific information.
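A hedged sketch of what such a subject-conditioned layer could look like (names and initialization are illustrative, not the exact bm.common.SubjectLayers code):
import torch

class SubjectLayersSketch(torch.nn.Module):
    def __init__(self, in_channels: int, out_channels: int, n_subjects: int):
        super().__init__()
        # one (out_channels, in_channels) matrix per subject
        self.weights = torch.nn.Parameter(
            torch.randn(n_subjects, out_channels, in_channels) / in_channels ** 0.5)

    def forward(self, x: torch.Tensor, subjects: torch.Tensor) -> torch.Tensor:
        # x: (B, C_in, T), subjects: (B,) integer subject ids
        w = self.weights[subjects]               # (B, C_out, C_in)
        return torch.einsum("boc,bct->bot", w, x)

layer = SubjectLayersSketch(270, 270, 27)
x = torch.randn(8, 270, 343)
subjects = torch.zeros(8, dtype=torch.long)
print(layer(x, subjects).shape)  # torch.Size([8, 270, 343])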
subjects = batch.subject_index.to(device=features.device,dtype=torch.int64)
inputs["meg"] = solver.model.subject_layers(inputs["meg"], subjects) # see bm.common.SubjectLayers
solver.model.subject_layers
SubjectLayers(270, 270, 27)
Residual dilated convolutions¶
Residual dilated convolutions are the main component of the brain module. The implementation combines residual skip connections, batch normalization, and GELU activations to extract M/EEG features. One important detail is that the output of this part must match the dimensionality of the speech representations so that the contrastive loss can be computed.
Below are the details of the convolutional layer:
encoded = {}
for name, x in inputs.items():
    encoded[name] = solver.model.encoders[name](x)
inputs = [x[1] for x in sorted(encoded.items())]
x = torch.cat(inputs, dim=1)
x = solver.model.final(x)
assert x.shape[-1] >= length
estimate = x[:, :, :length]
solver.model.encoders
ModuleDict( (meg): ConvSequence( (sequence): ModuleList( (0): Sequential( (0): Conv1d(270, 320, kernel_size=(3,), stride=(1,), padding=(1,)) (1): BatchNorm1d(320, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True) (2): GELU(approximate='none') ) (1): Sequential( (0): Conv1d(320, 320, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,)) (1): BatchNorm1d(320, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True) (2): GELU(approximate='none') ) (2): Sequential( (0): Conv1d(320, 320, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,)) (1): BatchNorm1d(320, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True) (2): GELU(approximate='none') ) (3): Sequential( (0): Conv1d(320, 320, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,)) (1): BatchNorm1d(320, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True) (2): GELU(approximate='none') ) (4): Sequential( (0): Conv1d(320, 320, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,)) (1): BatchNorm1d(320, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True) (2): GELU(approximate='none') ) (5): Sequential( (0): Conv1d(320, 320, kernel_size=(3,), stride=(1,), padding=(1,)) (1): BatchNorm1d(320, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True) (2): GELU(approximate='none') ) (6): Sequential( (0): Conv1d(320, 320, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,)) (1): BatchNorm1d(320, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True) (2): GELU(approximate='none') ) (7): Sequential( (0): Conv1d(320, 320, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,)) (1): BatchNorm1d(320, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True) (2): GELU(approximate='none') ) (8): Sequential( (0): Conv1d(320, 320, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,)) (1): BatchNorm1d(320, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True) (2): GELU(approximate='none') ) (9): Sequential( (0): Conv1d(320, 320, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,)) (1): BatchNorm1d(320, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True) (2): GELU(approximate='none') ) ) (glus): ModuleList( (0): None (1): Sequential( (0): Conv1d(320, 640, kernel_size=(3,), stride=(1,), padding=(1,)) (1): GLU(dim=1) ) (2): None (3): Sequential( (0): Conv1d(320, 640, kernel_size=(3,), stride=(1,), padding=(1,)) (1): GLU(dim=1) ) (4): None (5): Sequential( (0): Conv1d(320, 640, kernel_size=(3,), stride=(1,), padding=(1,)) (1): GLU(dim=1) ) (6): None (7): Sequential( (0): Conv1d(320, 640, kernel_size=(3,), stride=(1,), padding=(1,)) (1): GLU(dim=1) ) (8): None (9): Sequential( (0): Conv1d(320, 640, kernel_size=(3,), stride=(1,), padding=(1,)) (1): GLU(dim=1) ) ) ) )
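To make the printout above more readable, here is a hedged sketch of a single residual dilated block (the exact wiring, including how the GLU branches alternate with plain blocks, lives in bm's ConvSequence):
import torch

class DilatedBlockSketch(torch.nn.Module):
    def __init__(self, channels: int = 320, dilation: int = 2):
        super().__init__()
        self.conv = torch.nn.Sequential(
            torch.nn.Conv1d(channels, channels, kernel_size=3,
                            padding=dilation, dilation=dilation),
            torch.nn.BatchNorm1d(channels),
            torch.nn.GELU())
        self.glu = torch.nn.Sequential(
            torch.nn.Conv1d(channels, 2 * channels, kernel_size=3, padding=1),
            torch.nn.GLU(dim=1))

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        # padding matches the dilation, so the time dimension is preserved
        return x + self.glu(self.conv(x))

x = torch.randn(8, 320, 343)
print(DilatedBlockSketch()(x).shape)  # torch.Size([8, 320, 343])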
pred, trues, features_mask, reject_mask = estimate, output, features_mask, reject_mask
CLIP loss¶
After obtaining representations of the speech and the corresponding brain signals, we can establish a mapping between them. A classical approach is regression. However, the authors speculate that regression may be an ineffective loss because it deviates from the actual goal, i.e. maximally discriminating between different speech segments. A regression loss also implicitly assumes that all dimensions of, say, a Mel spectrogram are equally important and similarly scaled: a mean-squared-error objective pushes the model to be equally good at predicting low and high frequencies, even though (1) some frequencies, such as very low ones, may be irrelevant to speech, and (2) some frequencies vary far less than others.
In the previous steps, extreme outliers have been removed and the normalization carefully designed. Finally, the authors chose a contrastive loss as the training objective, which naturally encourages the model to focus on the informative dimensions and scale them appropriately.
Let $X$ be a brain recording segment and $Y\in \mathbb{R}^{F\times T}$ the latent representation of its corresponding sound (a.k.a "positive sample"). We sample $N - 1 $ negative samples $\bar{Y}_{j\in \{1, \ldots, N-1\}}$ over our dataset and we add the positive sample as $\bar{Y}_N = Y$.
We want our model to predict the probabilities $ \forall j \in\{1, \ldots, N\}, p_j = \mathbb{P}{[\bar{Y_j} = Y]}. $ We thus train a model $f_{\mathrm{clip}}$ mapping the brain activity $X$ to a latent representation $Z = f_{\mathrm{clip}}(X) \in \mathbb{R}^{F\times T}$. The estimated probability can then be approximated by the dot product of $Z$ and the candidate speech latent representations $Y_j$, followed by a softmax:
$$ \begin{equation} \hat{p}_{j} = \frac{\mathrm{e}^{\langle Z,\bar{Y}_j \rangle }}{\sum_{j'=1}^N \mathrm{e}^{ \langle Z,\bar{Y}_{j'} \rangle }}, \end{equation} $$
with $\langle \cdot, \cdot \rangle$ the inner product over both dimensions of $Z$ and $\bar{Y}_j$.
During inference, a test sample is scored against the collected negative samples, and $\hat{p}_{N}$ denotes the probability assigned to the true (positive) segment. If the positive segment receives the highest probability among the $N$ candidates, the sample counts toward Top-1 accuracy; if it is ranked within the ten highest, it counts toward Top-10 accuracy.
We train $f_{\mathrm{clip}}$ with a cross-entropy between $p_{j}$ and $\hat{p}_{j}$. Note that for a large enough dataset, we can neglect the probability of sampling the same segment twice, so that $p_j = 1_{j = N}$ and the cross-entropy simplifies to
$$ \begin{equation} L_\mathrm{CLIP}(p, \hat{p}) = -\log(\hat{p}_{N}) = -\langle Z,Y\rangle + \log\Big(\sum_{j'=1}^{N}\mathrm{e}^{\langle Z, \bar{Y}_{j'}\rangle} \Big). \end{equation} $$
At training time, the other elements of the batch serve as negative samples; at inference time, the negative samples correspond to all segments of the test set except the positive one.
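Before calling the repository's ClipLoss, here is a hedged, self-contained sketch of the probability computation described above (the actual get_probabilities may differ in details such as normalization):
import torch

def clip_probabilities(z: torch.Tensor, candidates: torch.Tensor) -> torch.Tensor:
    # z: (B, F, T) predicted brain latents; candidates: (N, F, T) speech latents.
    # The inner product is taken over both the feature and time dimensions,
    # then turned into a softmax over the N candidates.
    scores = torch.einsum("bft,nft->bn", z, candidates)
    return torch.softmax(scores, dim=1)

z = torch.randn(8, 1024, 343)
y = torch.randn(8, 1024, 343)
print(clip_probabilities(z, y).shape)  # torch.Size([8, 8]), as in the cell below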
clip = solver.loss
candidates = trues.cuda() # Setup negatives
probs = clip.get_probabilities(pred.cuda(), candidates).cpu()
candidates.shape, probs.shape
(torch.Size([8, 1024, 343]), torch.Size([8, 8]))
Result¶
Finally, we can iterate through the entire test set to obtain the overall statistics. As shown below, we successfully reproduce a Top-10 accuracy of 70.60 on the gwilliams2022 dataset.
evaluator = Evaluator("97d170e1", shuffle_test_data=False)
evaluator.solver.args.num_workers = 20
# Load test data
evaluator.load_test_data(
n_recordings=None, # conf.n_recordings None
batch_size=1000, # conf.load_batch_size 1000
test_study="gwilliams2022")
[11-14 22:39:10][scripts.run_eval_probs][INFO] - Loading solver 97d170e1 [11-14 22:39:10][bm.play][INFO] - Loading solver from XP 97d170e1. Overrides used: ['dset.selections=[gwilliams2022]'] [11-14 22:39:10][bm._env][WARNING] - Hostname gpu226.corp.yodao.com not defined in /conf/study_paths/study_paths.yaml. Using default paths.
[11-14 22:39:10][bm.dataset][WARNING] - Requested 1000 recordings but only found 196 [11-14 22:39:21][bm.dataset][INFO] - Loading Subjects | 39/196 | 6.21 it/sec [11-14 22:39:27][bm.dataset][INFO] - Loading Subjects | 78/196 | 6.09 it/sec [11-14 22:39:34][bm.dataset][INFO] - Loading Subjects | 117/196 | 6.05 it/sec [11-14 22:39:41][bm.dataset][INFO] - Loading Subjects | 156/196 | 5.83 it/sec [11-14 22:39:48][bm.dataset][INFO] - Loading Subjects | 195/196 | 5.84 it/sec [11-14 22:39:48][bm.dataset][INFO] - # Examples (train | valid | test): 203152 | 35156 | 69972 [11-14 22:39:48][bm.train][INFO] - Model hash: ed97b0fbdffe06faf696d2eecaacb57b143fd68d /ssd3/other/penglinkai01/miniconda3/envs/bm/lib/python3.8/site-packages/flashy/loggers/tensorboard.py:47: UserWarning: tensorboard package was not found: use pip install tensorboard warnings.warn("tensorboard package was not found: use pip install tensorboard") [11-14 22:39:48][scripts.run_eval_probs][INFO] - Extracting test data
[11-14 22:40:33][scripts.run_eval_probs][INFO] - extract | 3/70 | 10.8 sec/it [11-14 22:40:41][scripts.run_eval_probs][INFO] - extract | 6/70 | 0.14 it/sec [11-14 22:40:49][scripts.run_eval_probs][INFO] - extract | 9/70 | 0.17 it/sec [11-14 22:40:58][scripts.run_eval_probs][INFO] - extract | 12/70 | 0.19 it/sec [11-14 22:41:07][scripts.run_eval_probs][INFO] - extract | 15/70 | 0.21 it/sec [11-14 22:41:19][scripts.run_eval_probs][INFO] - extract | 18/70 | 0.21 it/sec [11-14 22:41:30][scripts.run_eval_probs][INFO] - extract | 21/70 | 0.22 it/sec [11-14 22:41:39][scripts.run_eval_probs][INFO] - extract | 24/70 | 0.23 it/sec [11-14 22:41:48][scripts.run_eval_probs][INFO] - extract | 27/70 | 0.24 it/sec [11-14 22:41:57][scripts.run_eval_probs][INFO] - extract | 30/70 | 0.24 it/sec [11-14 22:42:07][scripts.run_eval_probs][INFO] - extract | 33/70 | 0.25 it/sec [11-14 22:42:16][scripts.run_eval_probs][INFO] - extract | 36/70 | 0.25 it/sec [11-14 22:42:26][scripts.run_eval_probs][INFO] - extract | 39/70 | 0.26 it/sec [11-14 22:42:36][scripts.run_eval_probs][INFO] - extract | 42/70 | 0.26 it/sec [11-14 22:42:45][scripts.run_eval_probs][INFO] - extract | 45/70 | 0.26 it/sec [11-14 22:42:54][scripts.run_eval_probs][INFO] - extract | 48/70 | 0.27 it/sec [11-14 22:43:04][scripts.run_eval_probs][INFO] - extract | 51/70 | 0.27 it/sec [11-14 22:43:14][scripts.run_eval_probs][INFO] - extract | 54/70 | 0.27 it/sec [11-14 22:43:24][scripts.run_eval_probs][INFO] - extract | 57/70 | 0.27 it/sec [11-14 22:43:34][scripts.run_eval_probs][INFO] - extract | 60/70 | 0.27 it/sec [11-14 22:43:44][scripts.run_eval_probs][INFO] - extract | 63/70 | 0.27 it/sec [11-14 22:43:54][scripts.run_eval_probs][INFO] - extract | 66/70 | 0.27 it/sec [11-14 22:44:04][scripts.run_eval_probs][INFO] - extract | 69/70 | 0.28 it/sec
preds, trues = evaluator.preds, evaluator.trues
clip = evaluator.solver.loss
# Setup negatives
candidates = trues.cuda()
# Loop over samples
loader = DataLoader(TensorDataset(preds, torch.arange(0, len(preds)),),batch_size=8)
probs = torch.zeros(len(preds), len(trues))
lp = flashy.logging.LogProgressBar(logger, loader, updates=20, name='probs')
for preds_, idx_ in lp:
    # Compute probabilities
    probs_ = clip.get_probabilities(preds_.cuda(), candidates).cpu()
    # Update
    probs[idx_] = probs_
[11-14 22:44:32][__main__][INFO] - probs | 437/8747 | 60.30 it/sec [11-14 22:44:39][__main__][INFO] - probs | 874/8747 | 61.85 it/sec [11-14 22:44:45][__main__][INFO] - probs | 1311/8747 | 62.29 it/sec [11-14 22:44:54][__main__][INFO] - probs | 1748/8747 | 58.44 it/sec [11-14 22:45:12][__main__][INFO] - probs | 2185/8747 | 45.84 it/sec [11-14 22:45:45][__main__][INFO] - probs | 2622/8747 | 32.59 it/sec [11-14 22:46:06][__main__][INFO] - probs | 3059/8747 | 30.19 it/sec [11-14 22:46:24][__main__][INFO] - probs | 3496/8747 | 29.15 it/sec [11-14 22:46:54][__main__][INFO] - probs | 3933/8747 | 26.34 it/sec [11-14 22:47:10][__main__][INFO] - probs | 4370/8747 | 26.31 it/sec [11-14 22:47:36][__main__][INFO] - probs | 4807/8747 | 25.09 it/sec [11-14 22:48:16][__main__][INFO] - probs | 5244/8747 | 22.61 it/sec [11-14 22:48:55][__main__][INFO] - probs | 5681/8747 | 21.00 it/sec [11-14 22:49:18][__main__][INFO] - probs | 6118/8747 | 20.86 it/sec [11-14 22:49:55][__main__][INFO] - probs | 6555/8747 | 19.85 it/sec [11-14 22:50:23][__main__][INFO] - probs | 6992/8747 | 19.48 it/sec [11-14 22:50:58][__main__][INFO] - probs | 7429/8747 | 18.87 it/sec [11-14 22:51:20][__main__][INFO] - probs | 7866/8747 | 18.94 it/sec [11-14 22:51:37][__main__][INFO] - probs | 8303/8747 | 19.19 it/sec [11-14 22:52:14][__main__][INFO] - probs | 8740/8747 | 18.61 it/sec
# probs, target_labels, vocab_labels
# probs_segment, segment_hashes, vocab_segment
target_labels = evaluator.metadata["segment_hashes"]
vocab_labels = evaluator.trues_segment_hashes
for topk in (1, 5, 10):
    # Extract topk indices
    idx = probs.topk(topk, dim=1).indices
    # Get the corresponding topk labels
    whs = vocab_labels[idx.view(-1)].reshape(idx.shape)
    # 1 if the labels matches with the targets
    correct = ((whs == target_labels[:, None]).any(1)).float()
    # Average across samples
    acc = correct.mean()
    logger.info("Top-%d acc: %.2f", topk, 100 * acc)
[11-14 22:52:14][__main__][INFO] - Top-1 acc: 41.16 [11-14 22:52:14][__main__][INFO] - Top-5 acc: 62.52 [11-14 22:52:14][__main__][INFO] - Top-10 acc: 70.60
Discussion¶
From the above experiments, the Top-10 accuracy is about 70%, which is an exciting result and indicates that many of the proposed methods and processing steps have a positive impact. However, the following points show that considerable work remains:
- Generalization: the subject embedding is a promising attempt, suggesting that future decoding systems may not require complex adaptation for each individual. However, the differences across datasets indicate that this problem is still challenging.
- Supervised EEG segmentation: the EEG signals are segmented in a "supervised" manner using speech annotations; in other words, we already know that "this part contains speech" and only then classify it.
- Precision: each classification unit is a 3 s segment, and the pretrained speech features are temporally compressed, making it difficult to decode continuous speech at fine temporal resolution.
Language models, especially large language models, may help alleviate the low temporal resolution to some extent. As mentioned above, Tang et al. leverage GPT and a creative beam search method to enhance decoding performance with contextual information.
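As a closing illustration, here is a hedged sketch of what such LM-guided beam search could look like. GPT-2 merely stands in for a stronger language model, and similarity_per_step is a hypothetical stand-in for scores derived from the decoded brain representations (e.g. the similarity between candidate word embeddings and the embedding predicted from M/EEG).
import torch
from transformers import GPT2LMHeadModel, GPT2Tokenizer

tokenizer = GPT2Tokenizer.from_pretrained("gpt2")
lm = GPT2LMHeadModel.from_pretrained("gpt2").eval()

def lm_logprob(text: str) -> float:
    ids = tokenizer(text, return_tensors="pt").input_ids
    with torch.no_grad():
        out = lm(ids, labels=ids)
    return -out.loss.item() * ids.shape[1]  # approximate total log-likelihood

def beam_search(prefixes, similarity_per_step, beam_size=4, alpha=1.0):
    """similarity_per_step: one {word: brain_similarity} dict per decoded step."""
    beams = [(p, 0.0) for p in prefixes]
    for sims in similarity_per_step:
        expanded = []
        for text, _ in beams:
            for word, sim in sims.items():
                candidate = f"{text} {word}".strip()
                # combine LM fluency with agreement to the decoded representation
                expanded.append((candidate, lm_logprob(candidate) + alpha * sim))
        beams = sorted(expanded, key=lambda b: b[1], reverse=True)[:beam_size]
    return beams

# e.g. beam_search(["Tara"], [{"stood": 0.9, "sat": 0.4}, {"stock": 0.8, "still": 0.7}])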