cffan
diff --git a/‎.gitignore‎
Lines changed: 40 additions & 0 deletions b/‎.gitignore‎
Lines changed: 40 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 14 additions & 0 deletions b/‎README.md‎
Lines changed: 14 additions & 0 deletions
diff --git a/‎notebooks/formatCompetitionData.ipynb‎
Lines changed: 330 additions & 0 deletions b/‎notebooks/formatCompetitionData.ipynb‎
Lines changed: 330 additions & 0 deletions
diff --git a/‎pyproject.toml‎
Lines changed: 2 additions & 0 deletions b/‎pyproject.toml‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎scripts/eval_competition.py‎
Lines changed: 143 additions & 0 deletions b/‎scripts/eval_competition.py‎
Lines changed: 143 additions & 0 deletions
diff --git a/‎scripts/eval_competition.sh‎
Lines changed: 21 additions & 0 deletions b/‎scripts/eval_competition.sh‎
Lines changed: 21 additions & 0 deletions
diff --git a/‎scripts/train_model.py‎
Lines changed: 29 additions & 0 deletions b/‎scripts/train_model.py‎
Lines changed: 29 additions & 0 deletions
diff --git a/‎setup.cfg‎
Lines changed: 59 additions & 0 deletions b/‎setup.cfg‎
Lines changed: 59 additions & 0 deletions
diff --git a/‎setup.py‎
Lines changed: 22 additions & 0 deletions b/‎setup.py‎
Lines changed: 22 additions & 0 deletions
diff --git a/‎src/neural_decoder.egg-info/PKG-INFO‎
Lines changed: 22 additions & 0 deletions b/‎src/neural_decoder.egg-info/PKG-INFO‎
Lines changed: 22 additions & 0 deletions
@@ -0,0 +1,40 @@
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+
+# Visual Studio Code files
+.vscode
+.vs
+
+# PyCharm files
+.idea
+
+# Eclipse Project settings
+*.*project
+.settings
+
+# Sublime Text settings
+*.sublime-workspace
+*.sublime-project
+
+# Editor temporaries
+*.swn
+*.swo
+*.swp
+*.swm
+*.asv
+*~
+
+# IPython notebook checkpoints
+.ipynb_checkpoints
+
+# macOS dir files
+.DS_Store
+
+**/build
+
+Archive/*
+
+# Matlab
+*.asv
@@ -0,0 +1,14 @@
+## PyTorch implementation of [Neural Sequence Decoder](https://github.com/fwillett/speechBCI/tree/main/NeuralDecoder)
+
+## Requirements
+- python >= 3.9
+
+## Installation
+
+```bash
+pip install -e .
+```
+
+## How to run
+
+1. Convert the speech BCI dataset using [formatCompetitionData.ipynb](./notebooks/formatCompetitionData.ipynb)
+2. Train model: `python ./scripts/train_model.py`
+
@@ -0,0 +1,2 @@
+[build-system]
+requires = ["setuptools>=46.1.0"]
@@ -0,0 +1,143 @@
+import re
+import time
+import pickle
+import numpy as np
+
+from edit_distance import SequenceMatcher
+import torch
+from dataset import SpeechDataset
+
+import matplotlib.pyplot as plt
+
+
+from nnDecoderModel import getDatasetLoaders
+from nnDecoderModel import loadModel
+import neuralDecoder.utils.lmDecoderUtils as lmDecoderUtils
+import pickle
+import argparse
+
+parser = argparse.ArgumentParser(description="")
+parser.add_argument("--modelPath", type=str, default=None, help="Path to model")
+input_args = parser.parse_args()
+
+
+with open(input_args.modelPath + "/args", "rb") as handle:
+    args = pickle.load(handle)
+
+args["datasetPath"] = "/oak/stanford/groups/henderj/stfan/data/ptDecoder_ctc"
+trainLoaders, testLoaders, loadedData = getDatasetLoaders(
+    args["datasetPath"], args["seqLen"], args["maxTimeSeriesLen"], args["batchSize"]
+)
+
+model = loadModel(input_args.modelPath, device="cpu")
+
+device = "cpu"
+
+model.eval()
+
+rnn_outputs = {
+    "logits": [],
+    "logitLengths": [],
+    "trueSeqs": [],
+    "transcriptions": [],
+}
+partition = "competition"
+for i, testDayIdx in enumerate([4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 18, 19, 20]):
+    # for i, testDayIdx in enumerate(range(len(loadedData[partition]))):
+    test_ds = SpeechDataset([loadedData[partition][i]])
+    test_loader = torch.utils.data.DataLoader(
+        test_ds, batch_size=1, shuffle=False, num_workers=0
+    )
+    for j, (X, y, X_len, y_len, _) in enumerate(test_loader):
+        X, y, X_len, y_len, dayIdx = (
+            X.to(device),
+            y.to(device),
+            X_len.to(device),
+            y_len.to(device),
+            torch.tensor([testDayIdx], dtype=torch.int64).to(device),
+        )
+        pred = model.forward(X, dayIdx)
+        adjustedLens = ((X_len - model.kernelLen) / model.strideLen).to(torch.int32)
+
+        for iterIdx in range(pred.shape[0]):
+            trueSeq = np.array(y[iterIdx][0 : y_len[iterIdx]].cpu().detach())
+
+            rnn_outputs["logits"].append(pred[iterIdx].cpu().detach().numpy())
+            rnn_outputs["logitLengths"].append(
+                adjustedLens[iterIdx].cpu().detach().item()
+            )
+            rnn_outputs["trueSeqs"].append(trueSeq)
+
+        transcript = loadedData[partition][i]["transcriptions"][j].strip()
+        transcript = re.sub(r"[^a-zA-Z\- \']", "", transcript)
+        transcript = transcript.replace("--", "").lower()
+        rnn_outputs["transcriptions"].append(transcript)
+
+
+MODEL_CACHE_DIR = "/scratch/users/stfan/huggingface"
+# Load OPT 6B model
+llm, llm_tokenizer = lmDecoderUtils.build_opt(
+    cacheDir=MODEL_CACHE_DIR, device="auto", load_in_8bit=True
+)
+
+lmDir = "/oak/stanford/groups/henderj/stfan/code/nptlrig2/LanguageModelDecoder/examples/speech/s0/lm_order_exp/5gram/data/lang_test"
+ngramDecoder = lmDecoderUtils.build_lm_decoder(
+    lmDir, acoustic_scale=0.5, nbest=100, beam=18
+)
+
+
+
+# LM decoding hyperparameters
+acoustic_scale = 0.5
+blank_penalty = np.log(7)
+llm_weight = 0.5
+
+llm_outputs = []
+# Generate nbest outputs from 5gram LM
+start_t = time.time()
+nbest_outputs = []
+for j in range(len(rnn_outputs["logits"])):
+    logits = rnn_outputs["logits"][j]
+    logits = np.concatenate(
+        [logits[:, 1:], logits[:, 0:1]], axis=-1
+    )  # Blank is last token
+    logits = lmDecoderUtils.rearrange_speech_logits(logits[None, :, :], has_sil=True)
+    nbest = lmDecoderUtils.lm_decode(
+        ngramDecoder,
+        logits[0],
+        blankPenalty=blank_penalty,
+        returnNBest=True,
+        rescore=True,
+    )
+    nbest_outputs.append(nbest)
+time_per_sample = (time.time() - start_t) / len(rnn_outputs["logits"])
+print(f"5gram decoding took {time_per_sample} seconds per sample")
+
+for i in range(len(rnn_outputs["transcriptions"])):
+    new_trans = [ord(c) for c in rnn_outputs["transcriptions"][i]] + [0]
+    rnn_outputs["transcriptions"][i] = np.array(new_trans)
+
+# Rescore nbest outputs with LLM
+start_t = time.time()
+llm_out = lmDecoderUtils.cer_with_gpt2_decoder(
+    llm,
+    llm_tokenizer,
+    nbest_outputs[:],
+    acoustic_scale,
+    rnn_outputs,
+    outputType="speech_sil",
+    returnCI=True,
+    lengthPenalty=0,
+    alpha=llm_weight,
+)
+# time_per_sample = (time.time() - start_t) / len(logits)
+print(f"LLM decoding took {time_per_sample} seconds per sample")
+
+print(llm_out["cer"], llm_out["wer"])
+with open(input_args.modelPath + "/llm_out", "wb") as handle:
+    pickle.dump(llm_out, handle)
+
+decodedTranscriptions = llm_out["decoded_transcripts"]
+with open(input_args.modelPath + "/5gramLLMCompetitionSubmission.txt", "w") as f:
+    for x in range(len(decodedTranscriptions)):
+        f.write(decodedTranscriptions[x] + "\n")
@@ -0,0 +1,21 @@
+#!/bin/bash
+
+# Parameters
+#SBATCH --cpus-per-task=8
+#SBATCH --gpus-per-task=1
+#SBATCH --job-name=rescore
+#SBATCH --mail-type=ALL
+#SBATCH --mem=400GB
+#SBATCH --nodes=1
+#SBATCH --ntasks-per-node=1
+#SBATCH --open-mode=append
+#SBATCH --partition=henderj,owners
+#SBATCH --signal=USR1@120
+#SBATCH --time=2880
+#SBATCH --constraint=[GPU_MEM:32GB|GPU_MEM:40GB|GPU_MEM:80GB]
+
+ml gcc/10.1.0
+ml load cudnn/8.6.0.163
+ml load cuda/11.7.1
+
+python eval_competition.py --modelPath=$1
@@ -0,0 +1,29 @@
+
+modelName = 'speechBaseline4'
+
+args = {}
+args['outputDir'] = '/oak/stanford/groups/henderj/stfan/logs/speech_logs/' + modelName
+args['datasetPath'] = '/oak/stanford/groups/henderj/fwillett/speech/ptDecoder_ctc'
+args['seqLen'] = 150
+args['maxTimeSeriesLen'] = 1200
+args['batchSize'] = 64
+args['lrStart'] = 0.02
+args['lrEnd'] = 0.02
+args['nUnits'] = 1024
+args['nBatch'] = 10000 #3000
+args['nLayers'] = 5
+args['seed'] = 0
+args['nClasses'] = 40
+args['nInputFeatures'] = 256
+args['dropout'] = 0.4
+args['whiteNoiseSD'] = 0.8
+args['constantOffsetSD'] = 0.2
+args['gaussianSmoothWidth'] = 2.0
+args['strideLen'] = 4
+args['kernelLen'] = 32
+args['bidirectional'] = True
+args['l2_decay'] = 1e-5
+
+from neural_decoder.neural_decoder_trainer import trainModel
+
+trainModel(args)
@@ -0,0 +1,59 @@
+# This file is used to configure your project.
+# Read more about the various options under:
+# https://setuptools.pypa.io/en/latest/userguide/declarative_config.html
+# https://setuptools.pypa.io/en/latest/references/keywords.html
+
+[metadata]
+name = neural_decoder
+description = PyTorch neural sequence decoder for speech BCI (https://github.com/fwillett/speechBCI/tree/main/NeuralDecoder)
+version = 0.0.1
+author = Chaofei Fan, Frank Willett
+author_email = stfan@stanford.edu
+license = MIT
+license_files = LICENSE.txt
+# Add here related links, for example:
+project_urls =
+
+# Change if running only on Windows, Mac or Linux (comma-separated)
+platforms = Linux
+
+# Add here all kinds of additional classifiers as defined under
+# https://pypi.org/classifiers/
+classifiers =
+    Development Status :: 4 - Beta
+    Programming Language :: Python
+
+
+[options]
+zip_safe = False
+packages = find_namespace:
+include_package_data = True
+package_dir =
+    =src
+
+# Require a min/specific Python version (comma-separated conditions)
+python_requires = >=3.9
+
+# Add here dependencies of your project (line-separated), e.g. requests>=2.2,<3.0.
+# Version specifiers like >=2.2,<3.0 avoid problems due to API changes in
+# new major versions. This works if the required packages follow Semantic Versioning.
+# For more information, check out https://semver.org/.
+install_requires =
+    importlib-metadata; python_version<"3.8"
+    torch==1.13.1 
+    hydra-core==1.3.2
+    hydra-submitit-launcher==1.1.5
+    hydra-optuna-sweeper==1.2.0
+    numpy==1.25.0
+    scipy==1.11.1
+    numba==0.58.1
+    scikit-learn==1.3.2
+    g2p_en==2.1.0
+    edit_distance==1.0.6
+
+
+[options.packages.find]
+where = src
+exclude =
+    tests
+    examples
@@ -0,0 +1,22 @@
+"""
+    Setup file for OnlineRecalibrator.
+    Use setup.cfg to configure your project.
+
+    This file was generated with PyScaffold 4.5.
+    PyScaffold helps you to put up the scaffold of your new Python project.
+    Learn more under: https://pyscaffold.org/
+"""
+from setuptools import setup
+
+if __name__ == "__main__":
+    try:
+        setup(
+        )
+    except:  # noqa
+        print(
+            "\n\nAn error occurred while building the project, "
+            "please ensure you have the most updated version of setuptools, "
+            "setuptools_scm and wheel with:\n"
+            "   pip install -U setuptools setuptools_scm wheel\n\n"
+        )
+        raise
@@ -0,0 +1,22 @@
+Metadata-Version: 2.1
+Name: neural_decoder
+Version: 0.0.1
+Summary: PyTorch neural sequence decoder for speech BCI (https://github.com/fwillett/speechBCI/tree/main/NeuralDecoder)
+Author: Chaofei Fan, Frank Willett
+Author-email: stfan@stanford.edu
+License: MIT
+Platform: Linux
+Classifier: Development Status :: 4 - Beta
+Classifier: Programming Language :: Python
+Requires-Python: >=3.9
+Requires-Dist: importlib-metadata; python_version < "3.8"
+Requires-Dist: torch==1.13.1
+Requires-Dist: hydra-core==1.3.2
+Requires-Dist: hydra-submitit-launcher==1.1.5
+Requires-Dist: hydra-optuna-sweeper==1.2.0
+Requires-Dist: numpy==1.25.0
+Requires-Dist: scipy==1.11.1
+Requires-Dist: numba==0.58.1
+Requires-Dist: scikit-learn==1.3.2
+Requires-Dist: g2p_en==2.1.0
+Requires-Dist: edit_distance==1.0.6
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+[build-system]`
	`2`	`+requires = ["setuptools>=46.1.0"]`