跳转至

专题二——S5源码解读

论文:SIMPLIFIED STATE SPACE LAYERS FOR SEQUENCE MODELING(ICLR 2023 Top-5%) 代码链接:GitHub

专题二——S5模型源码解读

一、
附录——可供运行S5代码的一种环境依赖关系

·显卡驱动要求:CUDA >= 11.6
[注]jaxlib/torch 相关环境(即 Version 一栏中带有 cuda/cudnn/cu 标识的 package)需手动下载、安装。

Package                      Version
---------------------------- ---------------------
absl-py                      2.1.0
aiohttp                      3.8.6
aiosignal                    1.3.1
altair                       5.0.1
annotated-types              0.5.0
appdirs                      1.4.4
astunparse                   1.6.3
async-timeout                4.0.3
asynctest                    0.13.0
attrs                        21.2.0
backcall                     0.2.0
backports.cached-property    1.0.2
backports.zoneinfo           0.2.1
blessed                      1.20.0
blinker                      1.6.3
build                        0.10.0
CacheControl                 0.12.14
cachetools                   5.3.3
causal-conv1d                1.2.0.post2
certifi                      2024.2.2
cffi                         1.15.1
charset-normalizer           3.3.2
chex                         0.1.5
cleo                         2.1.0
click                        8.1.7
cloudpickle                  2.2.1
colorama                     0.4.6
commonmark                   0.9.1
crashtest                    0.4.1
cryptography                 42.0.7
cv                           1.0.0
cycler                       0.11.0
datasets                     2.13.2
decorator                    5.1.1
deepchem                     2.7.1
dgl                          1.1.3
dgllife                      0.3.2
dill                         0.3.6
diskcache                    5.6.3
distlib                      0.3.8
dm-tree                      0.1.8
dnspython                    2.3.0
docker                       6.1.3
docker-pycreds               0.4.0
dulwich                      0.21.7
einops                       0.6.1
entrypoints                  0.4
filelock                     3.12.2
flatbuffers                  24.3.25
flax                         0.6.1
fonttools                    4.38.0
frozenlist                   1.3.3
fsspec                       2023.1.0
future                       1.0.0
gast                         0.4.0
gitdb                        4.0.11
GitPython                    3.1.42
google-auth                  2.28.1
google-auth-oauthlib         0.4.6
google-pasta                 0.2.0
gpustat                      1.1.1
grpcio                       1.62.0
h5py                         3.8.0
html5lib                     1.1
huggingface-hub              0.16.4
hyperopt                     0.2.7
idna                         3.6
imageio                      2.31.2
importlib-metadata           6.7.0
importlib-resources          5.12.0
installer                    0.7.0
ipykernel                    5.5.5
ipython                      7.33.0
ipython-genutils             0.2.0
jaraco.classes               3.2.3
jax                          0.3.25
jaxlib                       0.3.25+cuda11.cudnn82
jedi                         0.19.1
jeepney                      0.8.0
Jinja2                       3.1.3
joblib                       1.3.2
jsonnet                      0.15.0
jsonschema                   4.17.3
jupyter-client               5.3.4
jupyter_core                 4.12.0
keras                        2.11.0
keyring                      23.13.1
kiwisolver                   1.4.5
libclang                     18.1.1
lie-learn                    0.0.1.post1
lightning-utilities          0.10.1
lmdb                         1.4.1
lockfile                     0.12.2
lxml                         4.6.3
mamba-ssm                    1.2.0.post1
Markdown                     3.4.4
markdown-it-py               2.2.0
MarkupSafe                   2.1.5
matplotlib                   3.5.3
matplotlib-inline            0.1.6
mdurl                        0.1.2
more-itertools               9.1.0
msgpack                      1.0.5
multidict                    6.0.5
multiprocess                 0.70.14
networkx                     2.6.3
ninja                        1.11.1.1
numpy                        1.21.6
nums-from-string             0.1.2
nvidia-ml-py                 12.535.133
oauthlib                     3.2.2
opencv-python                4.9.0.80
opt-einsum                   3.3.0
optax                        0.1.4
packaging                    23.2
pandas                       1.3.5
parso                        0.8.3
patsy                        0.5.6
pexpect                      4.9.0
pickleshare                  0.7.5
Pillow                       9.5.0
pip                          24.0
pkginfo                      1.10.0
pkgutil_resolve_name         1.3.10
platformdirs                 3.11.0
poetry                       1.5.1
poetry-core                  1.6.1
poetry-plugin-export         1.4.0
prompt-toolkit               3.0.42
protobuf                     3.20.0
pscan                        1.0.1
psutil                       5.9.8
ptyprocess                   0.7.0
py4j                         0.10.9.7
pyarrow                      12.0.1
pyasn1                       0.5.1
pyasn1-modules               0.3.0
pycparser                    2.21
pydantic                     2.5.3
pydantic_core                2.14.6
pydeck                       0.8.1b1
pyg-lib                      0.2.0+pt113cu116
Pygments                     2.17.2
pymongo                      4.6.2
Pympler                      1.0.1
pyparsing                    3.1.1
pyproject_hooks              1.1.0
pyrsistent                   0.19.3
python-dateutil              2.8.2
python-Levenshtein           0.12.0
pytorch-lightning            1.9.5
pytorch-model-summary        0.1.2
pytz                         2024.1
pytz-deprecation-shim        0.1.0.post0
PyYAML                       6.0.1
pyzmq                        24.0.1
rapidfuzz                    3.4.0
rdkit                        2023.3.2
regex                        2023.12.25
requests                     2.31.0
requests-oauthlib            1.3.1
requests-toolbelt            1.0.0
rich                         11.1.0
rsa                          4.9
rxn-chem-utils               1.5.0
rxn-utils                    1.6.0
rxnmapper                    0.3.0
safetensors                  0.4.2
scikit-learn                 1.0.2
scipy                        1.7.3
seaborn                      0.12.2
SecretStorage                3.3.3
sentencepiece                0.1.91
sentry-sdk                   1.42.0
setproctitle                 1.3.3
setuptools                   65.6.3
shellingham                  1.5.4
six                          1.16.0
smmap                        5.0.1
soupsieve                    2.4.1
statsmodels                  0.13.5
streamlit                    1.23.1
tenacity                     8.2.3
tensorboard                  2.11.2
tensorboard-data-server      0.6.1
tensorboard-plugin-wit       1.8.1
tensorflow                   2.11.0
tensorflow-estimator         2.11.0
tensorflow-io-gcs-filesystem 0.34.0
termcolor                    2.3.0
threadpoolctl                3.1.0
tokenizers                   0.11.1
toml                         0.10.2
tomli                        2.0.1
tomlkit                      0.12.5
toolz                        0.12.1
torch                        1.13.1+cu116
torch-cluster                1.6.1+pt113cu116
torch-scatter                2.1.1+pt113cu116
torch-sparse                 0.6.17+pt113cu116
torch-spline-conv            1.2.2+pt113cu116
torchaudio                   0.13.1+cu116
torchmetrics                 0.11.4
torchtext                    0.14.1
torchvision                  0.14.1+cu116
tornado                      6.2
tqdm                         4.66.4
traitlets                    5.9.0
transformers                 4.30.2
triton                       2.3.0
trove-classifiers            2024.5.22
typing_extensions            4.7.1
tzdata                       2024.1
tzlocal                      4.3.1
urllib3                      1.26.18
validators                   0.20.0
virtualenv                   20.26.2
wandb                        0.16.4
watchdog                     3.0.0
wcwidth                      0.1.9
webencodings                 0.5.1
websocket-client             1.6.1
Werkzeug                     2.2.3
wheel                        0.42.0
wrapt                        1.16.0
xxhash                       3.4.1
yarl                         1.9.4
zipp                         3.15.0