diff --git a/.dockerignore b/.dockerignore deleted file mode 100644 index a540e11fc8285e9d3c70f3590aaa15ea0f143b1e..0000000000000000000000000000000000000000 --- a/.dockerignore +++ /dev/null @@ -1,2 +0,0 @@ -lens -.git diff --git a/.gitattributes b/.gitattributes index d38175476330ebc679bc3ab6c4059a2b5f00ad7d..c7d9f3332a950355d5a77d85000f05e6f45435ea 100644 --- a/.gitattributes +++ b/.gitattributes @@ -32,4 +32,3 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text -*.pyc filter=lfs diff=lfs merge=lfs -text diff --git a/Dockerfile b/Dockerfile deleted file mode 100644 index b37462737be5068087d02d7f3e81b162491b5acd..0000000000000000000000000000000000000000 --- a/Dockerfile +++ /dev/null @@ -1,25 +0,0 @@ -FROM python:3.9 - -WORKDIR /code - -COPY ./requirements.txt /code/requirements.txt - -RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt - -# Set up a new user named "user" with user ID 1000 -RUN useradd -m -u 1000 user - -# Switch to the "user" user -USER user - -# Set home to the user's home directory -ENV HOME=/home/user \ - PATH=/home/user/.local/bin:$PATH - -# Set the working directory to the user's home directory -WORKDIR $HOME/app - -# Copy the current directory contents into the container at $HOME/app setting the owner to the user -COPY --chown=user . $HOME/app - -CMD ["python", "app.py"] diff --git a/README.md b/README.md index 9e77df2f9974291988a66ba8982098cef3473962..e60581a6aceb021d5b790f1bd06a12cd73c4921d 100644 --- a/README.md +++ b/README.md @@ -3,7 +3,10 @@ title: Tuned Lens emoji: 🔎 colorFrom: pink colorTo: blue -sdk: docker +sdk: gradio +python_version: 3.10.2 +sdk_version: 3.20.0 +app_file: app.py pinned: false license: mit --- diff --git a/__pycache__/app.cpython-310.pyc b/__pycache__/app.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..38be6ee86d10dd12e248744a482be6a6020aee6e Binary files /dev/null and b/__pycache__/app.cpython-310.pyc differ diff --git a/app.py b/app.py index 58ebd59e09e6b64b9720e81a568f5a111a532580..43005f713d4e76508b3232c1bc6a52e911782e2e 100644 --- a/app.py +++ b/app.py @@ -1,20 +1,17 @@ import torch from tuned_lens.nn.lenses import TunedLens, LogitLens from transformers import AutoModelForCausalLM, AutoTokenizer -from tuned_lens.plotting import PredictionTrajectory +from tuned_lens.plotting import plot_lens import gradio as gr from plotly import graph_objects as go device = torch.device("cpu") print(f"Using device {device} for inference") -model = AutoModelForCausalLM.from_pretrained("EleutherAI/pythia-410m-deduped") +model = AutoModelForCausalLM.from_pretrained("EleutherAI/pythia-410m-deduped-v0") model = model.to(device) -tokenizer = AutoTokenizer.from_pretrained("EleutherAI/pythia-410m-deduped") -tuned_lens = TunedLens.from_model_and_pretrained( - model=model, - map_location=device, -) -logit_lens = LogitLens.from_model(model) +tokenizer = AutoTokenizer.from_pretrained("EleutherAI/pythia-410m-deduped-v0") +tuned_lens = TunedLens.load("pythia-410m-deduped-v0", map_location=device) +logit_lens = LogitLens(model) lens_options_dict = { "Tuned Lens": tuned_lens, @@ -23,35 +20,32 @@ lens_options_dict = { statistic_options_dict = { "Entropy": "entropy", - "Cross Entropy": "cross_entropy", + "Cross Entropy": "ce", "Forward KL": "forward_kl", } def make_plot(lens, text, statistic, token_cutoff): - input_ids = tokenizer.encode(text) - input_ids = [tokenizer.bos_token_id] + input_ids - targets = input_ids[1:] + [tokenizer.eos_token_id] + input_ids = tokenizer.encode(text, return_tensors="pt") - if len(input_ids) == 1: + if len(input_ids[0]) == 0: return go.Figure(layout=dict(title="Please enter some text.")) if token_cutoff < 1: return go.Figure(layout=dict(title="Please provide valid token cut off.")) - start_pos=max(len(input_ids) - token_cutoff, 0) - pred_traj = PredictionTrajectory.from_lens_and_model( - lens=lens_options_dict[lens], - model=model, + fig = plot_lens( + model, + tokenizer, + lens_options_dict[lens], + layer_stride=2, input_ids=input_ids, - tokenizer=tokenizer, - targets=targets, - start_pos=start_pos, + start_pos=max(len(input_ids[0]) - token_cutoff, 0), + statistic=statistic_options_dict[statistic], ) - return getattr(pred_traj, statistic_options_dict[statistic])().figure( - title=f"{lens} ({model.name_or_path}) {statistic}", - ) + return fig + preamble = """ # The Tuned Lens 🔎 @@ -114,4 +108,5 @@ with gr.Blocks() as demo: demo.load(make_plot, [lens_options, text, statistic, token_cutoff], plot) if __name__ == "__main__": - demo.launch(server_name="0.0.0.0", server_port=7860) + demo.launch() + diff --git a/lens/CarperAI/stable-vicuna-13b/config.json b/lens/CarperAI/stable-vicuna-13b/config.json deleted file mode 100644 index d4281e1ab276a7318e54f8433900a37ac52d4d21..0000000000000000000000000000000000000000 --- a/lens/CarperAI/stable-vicuna-13b/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "vicuna-13b", "d_model": 5120, "num_hidden_layers": 40, "bias": true, "base_model_revision": null, "unembed_hash": "270c781d8280754a30abaf6fc186b1d754cc5d6bb17173d572d5517d5c7c702c", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/CarperAI/stable-vicuna-13b/params.pt b/lens/CarperAI/stable-vicuna-13b/params.pt deleted file mode 100644 index 9a012ea51f7eeacd26a74dd2590a6d6b4aa20d32..0000000000000000000000000000000000000000 --- a/lens/CarperAI/stable-vicuna-13b/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:47afb57632ac509a309e75da139e666ba5c7e93f2a305b2e286d7e748b7cc476 -size 2097581027 diff --git a/lens/EleutherAI/gpt-neox-20b/config.json b/lens/EleutherAI/gpt-neox-20b/config.json deleted file mode 100644 index 1155cb089d682f661ea3d7891b23ad210495246e..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/gpt-neox-20b/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/gpt-neox-20b", "d_model": 6144, "num_hidden_layers": 44, "bias": true, "base_model_revision": "4e49eadb5d14bd22f314ec3f45b69a87b88c7691", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/gpt-neox-20b/params.pt b/lens/EleutherAI/gpt-neox-20b/params.pt deleted file mode 100644 index 65b6a67bb1fdd7a589ada885154d6e19dd5c94d7..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/gpt-neox-20b/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e3c0e5911cbdabd33e5a59112eefb4f234a487fac77f830be7fc238ffb72e776 -size 6644881483 diff --git a/lens/EleutherAI/pythia-1.4b-deduped-v0/config.json b/lens/EleutherAI/pythia-1.4b-deduped-v0/config.json deleted file mode 100644 index b70300d227b9071d232c7777c85e0cb673a512c2..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-1.4b-deduped-v0/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-1.4b-deduped-v0", "d_model": 2048, "num_hidden_layers": 24, "bias": true, "base_model_revision": "b541e01fddacd3038799915cf8ff5b52e835a6c4", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-1.4b-deduped-v0/params.pt b/lens/EleutherAI/pythia-1.4b-deduped-v0/params.pt deleted file mode 100644 index 0a812423ccb63d0da79463cb3e1aa2e6e628a328..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-1.4b-deduped-v0/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:713d414666c3a99f4e08cbfb700e40ba551989a2d99bba9e649e7b568f6e3974 -size 402860707 diff --git a/lens/EleutherAI/pythia-1.4b-deduped/config.json b/lens/EleutherAI/pythia-1.4b-deduped/config.json deleted file mode 100644 index 1c7122dc18b77ca08d43368e42a4a79d0bc35fcb..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-1.4b-deduped/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-1.4b-deduped", "d_model": 2048, "num_hidden_layers": 24, "bias": true, "base_model_revision": null, "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-1.4b-deduped/params.pt b/lens/EleutherAI/pythia-1.4b-deduped/params.pt deleted file mode 100644 index 7df56ff54fa89ae6231be400ae6ae2583cd92364..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-1.4b-deduped/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b56db530d2c0df1bc5916bae58b241cfd4389dd4b1aa29e7210395df97164824 -size 402861347 diff --git a/lens/EleutherAI/pythia-12b-deduped-v0/config.json b/lens/EleutherAI/pythia-12b-deduped-v0/config.json deleted file mode 100644 index 15730b71a08276923eeb5f86fe92e8921ec6e997..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-12b-deduped-v0/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-12b-deduped-v0", "d_model": 5120, "num_hidden_layers": 36, "bias": true, "base_model_revision": "b497662035bf3c80b4f6a1ddfe09bc27763e843a", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-12b-deduped-v0/params.pt b/lens/EleutherAI/pythia-12b-deduped-v0/params.pt deleted file mode 100644 index 6443964b3ee51dd8a454c9d0d3d004d9b3558ad2..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-12b-deduped-v0/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a9e34c28c900b7230afe7ae1dc99b58b82c22b3265de2cbf939e3946cdcec126 -size 3775627331 diff --git a/lens/EleutherAI/pythia-12b-deduped/config.json b/lens/EleutherAI/pythia-12b-deduped/config.json deleted file mode 100644 index fad7d3daca2615ee1d7e2947d6d1727fbc4cb7df..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-12b-deduped/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-12b-deduped", "d_model": 5120, "num_hidden_layers": 36, "bias": true, "base_model_revision": null, "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-12b-deduped/params.pt b/lens/EleutherAI/pythia-12b-deduped/params.pt deleted file mode 100644 index 77991b01e3f6fc78dcb5e2570fdf57a32ed7aa42..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-12b-deduped/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8452947780e3caf7009a752d62f1a2d71c66f67b3855c7e409869b7e633db40e -size 3775628355 diff --git a/lens/EleutherAI/pythia-160m-deduped-v0/config.json b/lens/EleutherAI/pythia-160m-deduped-v0/config.json deleted file mode 100644 index dac7a4bbfe63e2cd1af368c20d87c6ccbafc6d93..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-160m-deduped-v0/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-160m-deduped-v0", "d_model": 768, "num_hidden_layers": 12, "bias": true, "base_model_revision": "7e57cc978f5da949f028f36b5baf8f5d6c3281b1", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-160m-deduped-v0/params.pt b/lens/EleutherAI/pythia-160m-deduped-v0/params.pt deleted file mode 100644 index 253e92be50d71b080bf298aad2c57e52e051ac28..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-160m-deduped-v0/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9644fe7196ae4ab63ce2ce1c7a22f63ae548021a27bac57c4c1cdd200d982cf8 -size 28353795 diff --git a/lens/EleutherAI/pythia-160m-deduped/config.json b/lens/EleutherAI/pythia-160m-deduped/config.json deleted file mode 100644 index 8292296cdfb48f0de06f36ed9036f9981b9464c0..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-160m-deduped/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-160m-deduped", "d_model": 768, "num_hidden_layers": 12, "bias": true, "base_model_revision": null, "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-160m-deduped/params.pt b/lens/EleutherAI/pythia-160m-deduped/params.pt deleted file mode 100644 index 54317bf887ad3d0f621d30272acf59ce85514233..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-160m-deduped/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1d16b68baa1eb903bbf74eaf859cee5c34361f3e8dff331b17f55b8ce52a2dbe -size 28354051 diff --git a/lens/EleutherAI/pythia-1b-deduped-v0/config.json b/lens/EleutherAI/pythia-1b-deduped-v0/config.json deleted file mode 100644 index f677b115f68397c0ded54a0adb6e71332e8fcd47..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-1b-deduped-v0/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-1b-deduped-v0", "d_model": 2048, "num_hidden_layers": 16, "bias": true, "base_model_revision": "021f79f50ff000ae1c159e22402ffec62284664d", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-1b-deduped-v0/params.pt b/lens/EleutherAI/pythia-1b-deduped-v0/params.pt deleted file mode 100644 index 0e0fe40e615b24803dcef833855f4a529b5c06bc..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-1b-deduped-v0/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e10ed1a0b10251aaf1b7c542f14ad2c7a850103dfdffcd9da3d21e107d779eeb -size 268573731 diff --git a/lens/EleutherAI/pythia-2.8b-deduped-v0/config.json b/lens/EleutherAI/pythia-2.8b-deduped-v0/config.json deleted file mode 100644 index 6dde57245db5a5f4391bd8d889f64003fa124a11..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-2.8b-deduped-v0/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-2.8b-deduped-v0", "d_model": 2560, "num_hidden_layers": 32, "bias": true, "base_model_revision": null, "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-2.8b-deduped-v0/params.pt b/lens/EleutherAI/pythia-2.8b-deduped-v0/params.pt deleted file mode 100644 index cdf87ecbb6fb2881c989b2080b03544dbbbe73ce..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-2.8b-deduped-v0/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f7892bd4af71a436aaba3a650ea907c94a077b8f16eb343c9a8762872c73026f -size 839204003 diff --git a/lens/EleutherAI/pythia-2.8b-deduped/config.json b/lens/EleutherAI/pythia-2.8b-deduped/config.json deleted file mode 100644 index 5a60f82c1eb9cddba8b046fbbc63002755a8d7f7..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-2.8b-deduped/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-2.8b-deduped", "d_model": 2560, "num_hidden_layers": 32, "bias": true, "base_model_revision": null, "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-2.8b-deduped/params.pt b/lens/EleutherAI/pythia-2.8b-deduped/params.pt deleted file mode 100644 index f08825ff4500d8fe43cfa7fc53c70ed70948c2e7..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-2.8b-deduped/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:314d403f2e1b1bf575ab2e851419d3a687c54138bfae5feace3ff00f1a96fd60 -size 839204003 diff --git a/lens/EleutherAI/pythia-410m-deduped-v0/config.json b/lens/EleutherAI/pythia-410m-deduped-v0/config.json deleted file mode 100644 index 7e4025c075430cb5e177f8cc75c9b0caff2439a0..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-410m-deduped-v0/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-410m-deduped-v0", "d_model": 1024, "num_hidden_layers": 24, "bias": true, "base_model_revision": "3538d3569a7e313e445ad6401c92c6e16777a2da", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-410m-deduped-v0/params.pt b/lens/EleutherAI/pythia-410m-deduped-v0/params.pt deleted file mode 100644 index 6a2fc58a64a8efda7c5ad9cb454d92f65a47006a..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-410m-deduped-v0/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:257a17d052d6bda84f338b1aa22ded8c17c401e1299b64cdab521178708ee7ac -size 100772515 diff --git a/lens/EleutherAI/pythia-410m-deduped/config.json b/lens/EleutherAI/pythia-410m-deduped/config.json deleted file mode 100644 index ee5bf8aff434ca741ef753de5fc2e3dc3b031a03..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-410m-deduped/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-410m-deduped", "d_model": 1024, "num_hidden_layers": 24, "bias": true, "base_model_revision": null, "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-410m-deduped/params.pt b/lens/EleutherAI/pythia-410m-deduped/params.pt deleted file mode 100644 index 1cc539359351cb8accfaa5b86cccdcbe2c3802ea..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-410m-deduped/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:166ea259b35481e1eb2feba50b5ac4d9a8faed47b0937ede0d7bd6d9830dbc95 -size 100773155 diff --git a/lens/EleutherAI/pythia-6.9b-deduped-v0/config.json b/lens/EleutherAI/pythia-6.9b-deduped-v0/config.json deleted file mode 100644 index 27e094938885d74b953f99510863cf57a30c1310..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-6.9b-deduped-v0/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-6.9b-deduped-v0", "d_model": 4096, "num_hidden_layers": 32, "bias": true, "base_model_revision": "cbd53efc2e56056e3bd0235277b5d0b668a6dfbb", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-6.9b-deduped-v0/params.pt b/lens/EleutherAI/pythia-6.9b-deduped-v0/params.pt deleted file mode 100644 index 2621022d862ecd0aad7cfd9fafbbb7d7be6ef26e..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-6.9b-deduped-v0/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3c99da7167d4a45a71c2f04c2db4d716a7a63f27406cb8948c9cb9f6c052b91c -size 2148022563 diff --git a/lens/EleutherAI/pythia-6.9b-deduped/config.json b/lens/EleutherAI/pythia-6.9b-deduped/config.json deleted file mode 100644 index 3e1bcd580e9a92cd37f70c7671e334b6bcd740f8..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-6.9b-deduped/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-6.9b-deduped", "d_model": 4096, "num_hidden_layers": 32, "bias": true, "base_model_revision": null, "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-6.9b-deduped/params.pt b/lens/EleutherAI/pythia-6.9b-deduped/params.pt deleted file mode 100644 index 454fbdcecc7f13d90c2dbb19fccb5580acab72c5..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-6.9b-deduped/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e2d00af6f64631b932b089fac5ca031061e207d51132a0f7433bd7a34fb06da0 -size 2148023459 diff --git a/lens/EleutherAI/pythia-70m-deduped-v0/config.json b/lens/EleutherAI/pythia-70m-deduped-v0/config.json deleted file mode 100644 index a030b8a54af4a856d61d819da05a89f1a5b6ea1c..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-70m-deduped-v0/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-70m-deduped-v0", "d_model": 512, "num_hidden_layers": 6, "bias": true, "base_model_revision": "ec30f7539a604fcb0b7fbba04fb1eb0110735d29", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-70m-deduped-v0/params.pt b/lens/EleutherAI/pythia-70m-deduped-v0/params.pt deleted file mode 100644 index 3fcdf8bb9b2bf16ebeb477015bc90369499624f6..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-70m-deduped-v0/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cbfc06e4d8733b1fccd5e1bb9cabd845072abfc8b92902ae1bbcbb2763fbc014 -size 6306739 diff --git a/lens/EleutherAI/pythia-70m-deduped/config.json b/lens/EleutherAI/pythia-70m-deduped/config.json deleted file mode 100644 index af95bb2b068b60d7d6fcb7b4e067296c74eedcb6..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-70m-deduped/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "EleutherAI/pythia-70m-deduped", "d_model": 512, "num_hidden_layers": 6, "bias": true, "base_model_revision": null, "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/EleutherAI/pythia-70m-deduped/params.pt b/lens/EleutherAI/pythia-70m-deduped/params.pt deleted file mode 100644 index b374fb1fe4c9f0f8eec2cf4a9f5c60742c624664..0000000000000000000000000000000000000000 --- a/lens/EleutherAI/pythia-70m-deduped/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c363b641564af68e9f9b73af56015b6b5c5b08caea5880787744eaabfab01343 -size 6306803 diff --git a/lens/facebook/llama-13b/config.json b/lens/facebook/llama-13b/config.json deleted file mode 100644 index 164088bcbd4e14d8e9a1f9d3dd87a1ec66f0bc32..0000000000000000000000000000000000000000 --- a/lens/facebook/llama-13b/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "huggyllama/llama-13b", "d_model": 5120, "num_hidden_layers": 40, "bias": true, "base_model_revision": null, "unembed_hash": "86cefdfd94bb3da225b405dd1328136786f6177b03d82f90e5c734d23c47e8ca", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/facebook/llama-13b/params.pt b/lens/facebook/llama-13b/params.pt deleted file mode 100644 index 77963d1952531ca707f410ee53c72ff402106891..0000000000000000000000000000000000000000 --- a/lens/facebook/llama-13b/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2700859b4335f4e4bdd4040232f594170bb717f8af04f65e5560c49cfb6da122 -size 2097581027 diff --git a/lens/facebook/llama-30b/config.json b/lens/facebook/llama-30b/config.json deleted file mode 100644 index 9acceec1235efe0c7170736687e0f69ed708d99a..0000000000000000000000000000000000000000 --- a/lens/facebook/llama-30b/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "huggyllama/llama-30b", "d_model": 6656, "num_hidden_layers": 60, "bias": true, "base_model_revision": null, "unembed_hash": "512b41bb8fc0e2b3647a877b5e114ca9503d7c800185b14a8e7ad9e921424367", "lens_type": "linear_tuned_lens"} diff --git a/lens/facebook/llama-30b/params.pt b/lens/facebook/llama-30b/params.pt deleted file mode 100644 index e705b2e99e3ece945c0c2e5b6bb9bc9c2ede59ed..0000000000000000000000000000000000000000 --- a/lens/facebook/llama-30b/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:10e781269b476a6de8f4ac12ea3f8b20fe22d3a8ca8cfdf770366a5f4e36c78f -size 5317111487 diff --git a/lens/facebook/llama-65b/config.json b/lens/facebook/llama-65b/config.json deleted file mode 100644 index 3fba9f1386a5a6a77601d7dad201eb03b820940b..0000000000000000000000000000000000000000 --- a/lens/facebook/llama-65b/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "huggyllama/llama-65b", "d_model": 8192, "num_hidden_layers": 80, "bias": true, "base_model_revision": null, "unembed_hash": "8ffc2dbf80dd5c131c4be9e347d090856bef2dbc973433dbd42ca9257b00d5e1", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/facebook/llama-65b/params.pt b/lens/facebook/llama-65b/params.pt deleted file mode 100644 index 312d6cf0a3b655581cc4ae8cb18908523565a9c7..0000000000000000000000000000000000000000 --- a/lens/facebook/llama-65b/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c9199874796630e1be615b0b34cd48e7f37ed09c6140153cdf6b7c509c45361b -size 10738779199 diff --git a/lens/facebook/llama-7b/config.json b/lens/facebook/llama-7b/config.json deleted file mode 100644 index 975a70715c914c2668eb088234b11e2dd41ba810..0000000000000000000000000000000000000000 --- a/lens/facebook/llama-7b/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "huggyllama/llama-7b", "d_model": 4096, "num_hidden_layers": 32, "bias": true, "base_model_revision": null, "unembed_hash": "7d0c2d720d286bdd706e662ea04f327204090f7d54054b0d5faabbc1b06a72fe", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/facebook/llama-7b/params.pt b/lens/facebook/llama-7b/params.pt deleted file mode 100644 index a27dd4210f1d327467fa102025014bc2b2d25701..0000000000000000000000000000000000000000 --- a/lens/facebook/llama-7b/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:02186a08b29e7173ae229218823b65891a7b2f2eadf0e69baf44a9c62b55a7cf -size 1074019491 diff --git a/lens/facebook/opt-1.3b/config.json b/lens/facebook/opt-1.3b/config.json deleted file mode 100644 index 7f1985c200e88f908717cb2b21fbcdb4a8d9d975..0000000000000000000000000000000000000000 --- a/lens/facebook/opt-1.3b/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "facebook/opt-1.3b", "d_model": 2048, "num_hidden_layers": 24, "bias": true, "base_model_revision": "8c7b10754972749675d22364c25c428b29face51", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/facebook/opt-1.3b/params.pt b/lens/facebook/opt-1.3b/params.pt deleted file mode 100644 index 2655789e5336bcd918a9b6fee1675bf8abb196c5..0000000000000000000000000000000000000000 --- a/lens/facebook/opt-1.3b/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2b5620752d01fcca26f5b7c36ec2b741974b570adfb64bffbd901cdc01dc9df9 -size 402860707 diff --git a/lens/facebook/opt-125m/config.json b/lens/facebook/opt-125m/config.json deleted file mode 100644 index 5b7e5a5d612c8bfe9bdd02327920d72d95764406..0000000000000000000000000000000000000000 --- a/lens/facebook/opt-125m/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "facebook/opt-125m", "d_model": 768, "num_hidden_layers": 12, "bias": true, "base_model_revision": "3d2b5f275bdf882b8775f902e1bfdb790e2cfc32", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/facebook/opt-125m/params.pt b/lens/facebook/opt-125m/params.pt deleted file mode 100644 index 37d89822fe6b9ad87fba762c25cfe629d1b7604f..0000000000000000000000000000000000000000 --- a/lens/facebook/opt-125m/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f61d7716618783244f2e7f5d26022df092b80695e9620ccb02c5ffb70f9b1405 -size 28353795 diff --git a/lens/facebook/opt-6.7b/config.json b/lens/facebook/opt-6.7b/config.json deleted file mode 100644 index 749d4eb6b8873415c1007325a6a5a826d88df853..0000000000000000000000000000000000000000 --- a/lens/facebook/opt-6.7b/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "facebook/opt-6.7b", "d_model": 4096, "num_hidden_layers": 32, "bias": true, "base_model_revision": "a45aa65bbeb77c1558bc99bedc6779195462dab0", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/facebook/opt-6.7b/params.pt b/lens/facebook/opt-6.7b/params.pt deleted file mode 100644 index 370a5187c68be80dcfb8236910f16a05c6382579..0000000000000000000000000000000000000000 --- a/lens/facebook/opt-6.7b/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9580fbf6e967c1be832ef415f3f74c0f6ee111637fba253dc5a75216dc305ebb -size 2148022563 diff --git a/lens/gpt-neox-20b/config.json b/lens/gpt-neox-20b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..818ff1e0ec18d827800e4d14ab40a1105c14bb6d --- /dev/null +++ b/lens/gpt-neox-20b/config.json @@ -0,0 +1 @@ +{"bias": true, "identity_init": true, "include_input": true, "include_final": false, "orthogonal": false, "rank": null, "sublayers": false, "d_model": 6144, "num_layers": 44, "vocab_size": 50432} \ No newline at end of file diff --git a/lens/gpt-neox-20b/params.pt b/lens/gpt-neox-20b/params.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd2c5e1cb3e60120ca63aa239cafbb5056dae974 --- /dev/null +++ b/lens/gpt-neox-20b/params.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:774144e329ee3741d0a7fff85b342f1a996aa24c788c3f741b03df596948a66d +size 3942186487 diff --git a/lens/gpt2-large/config.json b/lens/gpt2-large/config.json index 7c2825e5fc02e2c8e9a28b319d9530edb8e5028c..b77d79dfa8f30c3ab6c3bee00b32bb5aaa2e4cb9 100644 --- a/lens/gpt2-large/config.json +++ b/lens/gpt2-large/config.json @@ -1 +1,7 @@ -{"base_model_name_or_path": "gpt2-large", "d_model": 1280, "num_hidden_layers": 36, "bias": true, "base_model_revision": "212095d5832abbf9926672e1c1e8d14312a3be20", "lens_type": "linear_tuned_lens"} \ No newline at end of file +{ + "include_input": true, + "num_layers": 36, + "vocab_size": 50257, + "bias": true, + "d_model": 1280 +} \ No newline at end of file diff --git a/lens/gpt2-large/params.pt b/lens/gpt2-large/params.pt index 11721a616e583e0f782cbaec169935bce8f28793..be7f8750d070f3931c3210fda07f01cd5baab57f 100644 --- a/lens/gpt2-large/params.pt +++ b/lens/gpt2-large/params.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:291a85a7f524378221e2af0814c2a98c68f740c38993a0b62863f50adb3231db -size 236130371 +oid sha256:900bde39d9ad903985824852171f40ae406969dd7e92d1b5003f4208e4651b51 +size 493459767 diff --git a/lens/gpt2-xl/config.json b/lens/gpt2-xl/config.json index a7c0cd65adc019e4c81421676462caf8d77c0e84..d945ceba22211eb0f1095400d94716ffc5b8a76d 100644 --- a/lens/gpt2-xl/config.json +++ b/lens/gpt2-xl/config.json @@ -1 +1,7 @@ -{"base_model_name_or_path": "gpt2-xl", "d_model": 1600, "num_hidden_layers": 48, "bias": true, "base_model_revision": "33cdb5c0db5423c1879b1b9f16c352988e8754a8", "lens_type": "linear_tuned_lens"} \ No newline at end of file +{ + "bias": true, + "include_input": true, + "d_model": 1600, + "num_layers": 48, + "vocab_size": 50257 +} \ No newline at end of file diff --git a/lens/gpt2-xl/params.pt b/lens/gpt2-xl/params.pt index b708a28df8e21045187dd0c51d35638dda4b5f63..b0b456133fde8e88972c9b88cb4dd66c94146c67 100644 --- a/lens/gpt2-xl/params.pt +++ b/lens/gpt2-xl/params.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7c9b8eaf307a87965188d2311ee4d90d3c7868611e20aab263bc8e30b51320b6 -size 491849251 +oid sha256:96ea1cf6b4fa0c22710e7dd64499fecff2f4f6b0f1fb5f9d277d43e46cf88947 +size 813510935 diff --git a/lens/gpt2/config.json b/lens/gpt2/config.json index 4f43d2940b170aa19b31d295d5f10bd0d2908c85..98165995862877166684e857141a9b6e1e302184 100644 --- a/lens/gpt2/config.json +++ b/lens/gpt2/config.json @@ -1 +1,7 @@ -{"base_model_name_or_path": "gpt2", "d_model": 768, "num_hidden_layers": 12, "bias": true, "base_model_revision": "e7da7f221d5bf496a48136c0cd264e630fe9fcc8", "lens_type": "linear_tuned_lens"} \ No newline at end of file +{ + "bias": true, + "include_input": true, + "d_model": 768, + "num_layers": 12, + "vocab_size": 50257 +} \ No newline at end of file diff --git a/lens/gpt2/params.pt b/lens/gpt2/params.pt index 14b0d7bcd5da3db569f3ba3c3daf0c46a17d5c31..c8aad7f0bc34c5c13a7bfd1f97f7b23780444d19 100644 --- a/lens/gpt2/params.pt +++ b/lens/gpt2/params.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1e0494dcf4a56a77b73b421820941ea948ffae0c6a0391d88c9cb10b48bc19c8 -size 28353795 +oid sha256:9310b4ce09a053b38aa79dab8616309dc37db0d74a58ed683c1347859f9d9343 +size 182751031 diff --git a/lens/lmsys/vicuna-13b-v1.1/config.json b/lens/lmsys/vicuna-13b-v1.1/config.json deleted file mode 100644 index bdf4940362d37b864123cdd5dff5d3c4e16960de..0000000000000000000000000000000000000000 --- a/lens/lmsys/vicuna-13b-v1.1/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "vicuna-original-13b", "d_model": 5120, "num_hidden_layers": 40, "bias": true, "base_model_revision": null, "unembed_hash": "86cefdfd94bb3da225b405dd1328136786f6177b03d82f90e5c734d23c47e8ca", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/lmsys/vicuna-13b-v1.1/params.pt b/lens/lmsys/vicuna-13b-v1.1/params.pt deleted file mode 100644 index 9dad719390e626dba1190c154fa447f8787a7728..0000000000000000000000000000000000000000 --- a/lens/lmsys/vicuna-13b-v1.1/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0281f46b65b728cb390e41bd5848d8ab635b2847b48c080b2de2b78627baa40d -size 2097581027 diff --git a/lens/meta-llama/Llama-2-13b-chat-hf/config.json b/lens/meta-llama/Llama-2-13b-chat-hf/config.json deleted file mode 100644 index f17140a4f80243723d54207d8ac7e03fdb330122..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-13b-chat-hf/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "meta-llama/Llama-2-13b-chat-hf", "d_model": 5120, "num_hidden_layers": 40, "bias": true, "base_model_revision": null, "unembed_hash": "05e6ab11c049cc1356b38bf9ff84ffbedaf802a3c7fdda9e763bca0c4e9de2ab", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/meta-llama/Llama-2-13b-chat-hf/hh-rlhf/config.json b/lens/meta-llama/Llama-2-13b-chat-hf/hh-rlhf/config.json deleted file mode 100644 index f17140a4f80243723d54207d8ac7e03fdb330122..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-13b-chat-hf/hh-rlhf/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "meta-llama/Llama-2-13b-chat-hf", "d_model": 5120, "num_hidden_layers": 40, "bias": true, "base_model_revision": null, "unembed_hash": "05e6ab11c049cc1356b38bf9ff84ffbedaf802a3c7fdda9e763bca0c4e9de2ab", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/meta-llama/Llama-2-13b-chat-hf/hh-rlhf/params.pt b/lens/meta-llama/Llama-2-13b-chat-hf/hh-rlhf/params.pt deleted file mode 100644 index 00d178b9504b367bde551a75a87967c13b1b490e..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-13b-chat-hf/hh-rlhf/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6ceabb160e1b3ff887232514159bdf22c7f109a585759284eb7b18e72fb27667 -size 2097581027 diff --git a/lens/meta-llama/Llama-2-13b-chat-hf/params.pt b/lens/meta-llama/Llama-2-13b-chat-hf/params.pt deleted file mode 100644 index 8878ffe397eef446c401301a230513e804a7ed3c..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-13b-chat-hf/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6a8af029394d9be03e6a9a75a03ac477fdb9e42352ad3df035439bbb8ccb1b5d -size 2097581027 diff --git a/lens/meta-llama/Llama-2-13b-hf/config.json b/lens/meta-llama/Llama-2-13b-hf/config.json deleted file mode 100644 index 1b1b533d83452fd33a6097eae099b83e77d07381..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-13b-hf/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "meta-llama/Llama-2-13b-hf", "d_model": 5120, "num_hidden_layers": 40, "bias": true, "base_model_revision": null, "unembed_hash": "1f421a88f21fcda6d1c8c17a481c46918d355f8b06cfc77b05cf738e11b55f7a", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/meta-llama/Llama-2-13b-hf/params.pt b/lens/meta-llama/Llama-2-13b-hf/params.pt deleted file mode 100644 index 4c904cb27b20f39f57d91de533fa5ce150b0f9dc..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-13b-hf/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f87b2a5f2b3125d9e49343cbac244b901795e3af4117ec0f6ee428f79027778d -size 2097581027 diff --git a/lens/meta-llama/Llama-2-7b-chat-hf/config.json b/lens/meta-llama/Llama-2-7b-chat-hf/config.json deleted file mode 100644 index bb3da5d9cee530daa8f738438cd6ba26d83ab206..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-7b-chat-hf/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "meta-llama/Llama-2-7b-chat-hf", "d_model": 4096, "num_hidden_layers": 32, "bias": true, "base_model_revision": null, "unembed_hash": "3313b62209f366e7b19233ae7068501553350611c20f96caf2499c0486f8836b", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/meta-llama/Llama-2-7b-chat-hf/hh-rlhf/config.json b/lens/meta-llama/Llama-2-7b-chat-hf/hh-rlhf/config.json deleted file mode 100644 index bb3da5d9cee530daa8f738438cd6ba26d83ab206..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-7b-chat-hf/hh-rlhf/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "meta-llama/Llama-2-7b-chat-hf", "d_model": 4096, "num_hidden_layers": 32, "bias": true, "base_model_revision": null, "unembed_hash": "3313b62209f366e7b19233ae7068501553350611c20f96caf2499c0486f8836b", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/meta-llama/Llama-2-7b-chat-hf/hh-rlhf/params.pt b/lens/meta-llama/Llama-2-7b-chat-hf/hh-rlhf/params.pt deleted file mode 100644 index 6a79df8fb5174a0247bde4a21d2e97fa7164dac2..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-7b-chat-hf/hh-rlhf/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:86abc8c2a2044c3a70e88291b636222a6db6cdb25af51e86108e479843a2326e -size 2148023459 diff --git a/lens/meta-llama/Llama-2-7b-chat-hf/params.pt b/lens/meta-llama/Llama-2-7b-chat-hf/params.pt deleted file mode 100644 index d1823473cf01a7693e47ccbb1ab7699947174315..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-7b-chat-hf/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c66e7d56afd044bc6472e91bf6103ee5ab837c5953b44c791b0f1f8ac8ce8578 -size 2148023459 diff --git a/lens/meta-llama/Llama-2-7b-hf/config.json b/lens/meta-llama/Llama-2-7b-hf/config.json deleted file mode 100644 index 168bd6faa0a846012d95ae8bd515aeba928f7d61..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-7b-hf/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "meta-llama/Llama-2-7b-hf", "d_model": 4096, "num_hidden_layers": 32, "bias": true, "base_model_revision": null, "unembed_hash": "3313b62209f366e7b19233ae7068501553350611c20f96caf2499c0486f8836b", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/meta-llama/Llama-2-7b-hf/params.pt b/lens/meta-llama/Llama-2-7b-hf/params.pt deleted file mode 100644 index 0239435da2308cf03cd2727b4b248fd8d2f26a11..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Llama-2-7b-hf/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bc13d3a19107877e868019505dbc6428d594c573edcac2c28d1017dd521f8fb3 -size 2148023459 diff --git a/lens/meta-llama/Meta-Llama-3-8B-Instruct/config.json b/lens/meta-llama/Meta-Llama-3-8B-Instruct/config.json deleted file mode 100644 index dab3bf51e71356b28f3d989feb7fa7cddd87ecfb..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Meta-Llama-3-8B-Instruct/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "meta-llama/Meta-Llama-3-8B-Instruct", "d_model": 4096, "num_hidden_layers": 32, "bias": true, "base_model_revision": null, "unembed_hash": "fdd74d04451fa6853022839edeccc6a288ebdbae0f0371d8ca2316325be7e925", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/meta-llama/Meta-Llama-3-8B-Instruct/params.pt b/lens/meta-llama/Meta-Llama-3-8B-Instruct/params.pt deleted file mode 100644 index 210447ac1e23844c4bb4521444e17484d51c715b..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Meta-Llama-3-8B-Instruct/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0c1869e84c1d4f27d7ae6a46199daeee8c828db47c07438e0bc23d9b25b1166d -size 2148023890 diff --git a/lens/meta-llama/Meta-Llama-3-8B/config.json b/lens/meta-llama/Meta-Llama-3-8B/config.json deleted file mode 100644 index 03e39b6f6d7d09d46e5388203c4dde8f22953fe3..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Meta-Llama-3-8B/config.json +++ /dev/null @@ -1 +0,0 @@ -{"base_model_name_or_path": "meta-llama/Meta-Llama-3-8B", "d_model": 4096, "num_hidden_layers": 32, "bias": true, "base_model_revision": null, "unembed_hash": "de7042374eeecd4a3a6243327929653305d241c950c5dd79b6609d2d76390aa6", "lens_type": "linear_tuned_lens"} \ No newline at end of file diff --git a/lens/meta-llama/Meta-Llama-3-8B/params.pt b/lens/meta-llama/Meta-Llama-3-8B/params.pt deleted file mode 100644 index 386c6cf954858835adb10acd0215959fb8f70ffe..0000000000000000000000000000000000000000 --- a/lens/meta-llama/Meta-Llama-3-8B/params.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a2a0cf218333d8c33fbcc24b051ddf5afcdb4d240999626ca937f81e23b90967 -size 2148023890 diff --git a/lens/opt-1.3b/config.json b/lens/opt-1.3b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d3d80c3f883440ec337ea2a426335025613a7d29 --- /dev/null +++ b/lens/opt-1.3b/config.json @@ -0,0 +1 @@ +{"dropout": 0.0, "identity_init": true, "include_input": true, "layer_norm": false, "mlp_hidden_sizes": [], "rank": null, "shared_mlp_hidden_sizes": [], "share_weights": false, "sublayers": false, "num_layers": 24, "vocab_size": 50272, "bias": true, "d_model": 2048} \ No newline at end of file diff --git a/lens/opt-1.3b/params.pt b/lens/opt-1.3b/params.pt new file mode 100644 index 0000000000000000000000000000000000000000..1926c18b19fbe31095d36824f4927343537eb27f --- /dev/null +++ b/lens/opt-1.3b/params.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad2f68f2cdb252dd1019ee745f71fc016506064ee1811ef103ceecc93c31c9dc +size 814707799 diff --git a/lens/opt-125m/config.json b/lens/opt-125m/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df1588d24037875cac8705c337bbd95ccc18a029 --- /dev/null +++ b/lens/opt-125m/config.json @@ -0,0 +1 @@ +{"dropout": 0.0, "identity_init": true, "include_input": true, "layer_norm": false, "mlp_hidden_sizes": [], "rank": null, "shared_mlp_hidden_sizes": [], "share_weights": false, "sublayers": false, "num_layers": 12, "vocab_size": 50272, "bias": true, "d_model": 768} \ No newline at end of file diff --git a/lens/opt-125m/params.pt b/lens/opt-125m/params.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e73fd47177cb04821ba224efc8c202f968bb0ec --- /dev/null +++ b/lens/opt-125m/params.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae8648dc89c2b7ae903d231b2d38d87616dae5ffec7e79e3e549fec8207c159 +size 182797111 diff --git a/lens/opt-6.7b/config.json b/lens/opt-6.7b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..38f99d228b9627c653844ffb91568ded64855a98 --- /dev/null +++ b/lens/opt-6.7b/config.json @@ -0,0 +1 @@ +{"dropout": 0.0, "identity_init": true, "include_input": true, "layer_norm": false, "mlp_hidden_sizes": [], "rank": null, "shared_mlp_hidden_sizes": [], "share_weights": false, "sublayers": false, "num_layers": 32, "vocab_size": 50272, "bias": true, "d_model": 4096} \ No newline at end of file diff --git a/lens/opt-6.7b/params.pt b/lens/opt-6.7b/params.pt new file mode 100644 index 0000000000000000000000000000000000000000..92aa5e43476b4ee7f389ebaaaf64b8ca42e7a171 --- /dev/null +++ b/lens/opt-6.7b/params.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc4721db7049a4d0e9b84a07c44e58da28c778ba58bd42540e58507e2664fc10 +size 2971714775 diff --git a/lens/pythia-1.4b-deduped-v0/config.json b/lens/pythia-1.4b-deduped-v0/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c1c6d3aac33f1fa1b16ed9062392f2271c280341 --- /dev/null +++ b/lens/pythia-1.4b-deduped-v0/config.json @@ -0,0 +1 @@ +{"identity_init": true, "include_input": true, "rank": null, "shared_mlp_hidden_sizes": [], "sublayers": false, "num_layers": 24, "vocab_size": 50304, "bias": true, "d_model": 2048, "dropout": 0.0, "mlp_hidden_sizes": []} \ No newline at end of file diff --git a/lens/pythia-1.4b-deduped-v0/params.pt b/lens/pythia-1.4b-deduped-v0/params.pt new file mode 100644 index 0000000000000000000000000000000000000000..2182e0b08ebee33f04e33dadaa6443fcfb3627dc --- /dev/null +++ b/lens/pythia-1.4b-deduped-v0/params.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:993076b6486e55555a3699f44d74ede2235db26df9c61bccfed338077b6c8474 +size 814969879 diff --git a/lens/pythia-12b-deduped-v0/config.json b/lens/pythia-12b-deduped-v0/config.json new file mode 100644 index 0000000000000000000000000000000000000000..973105b36ea619d30d67d7a7c0bf64ab27ddecdb --- /dev/null +++ b/lens/pythia-12b-deduped-v0/config.json @@ -0,0 +1 @@ +{"dropout": 0.0, "identity_init": true, "include_input": true, "mlp_hidden_sizes": [], "rank": null, "shared_mlp_hidden_sizes": [], "share_weights": false, "sublayers": false, "num_layers": 36, "vocab_size": 50688, "bias": true, "d_model": 5120} \ No newline at end of file diff --git a/lens/pythia-12b-deduped-v0/params.pt b/lens/pythia-12b-deduped-v0/params.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b85883e3eb5ad1b7facc700e34114d7f58481f7 --- /dev/null +++ b/lens/pythia-12b-deduped-v0/params.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ca1e95270638a16156cc21f3358ad70162b79d58f1c5e84a5307a72ac4fa97d +size 4813762539 diff --git a/lens/pythia-160m-deduped-v0/config.json b/lens/pythia-160m-deduped-v0/config.json new file mode 100644 index 0000000000000000000000000000000000000000..98c7e64ba766c7059d50c38a1c1bf809b213a2a0 --- /dev/null +++ b/lens/pythia-160m-deduped-v0/config.json @@ -0,0 +1 @@ +{"dropout": 0.0, "identity_init": true, "include_input": true, "rank": null, "shared_mlp_hidden_sizes": [], "sublayers": false, "num_layers": 12, "vocab_size": 50304, "bias": true, "d_model": 768, "mlp_hidden_sizes": []} \ No newline at end of file diff --git a/lens/pythia-160m-deduped-v0/params.pt b/lens/pythia-160m-deduped-v0/params.pt new file mode 100644 index 0000000000000000000000000000000000000000..56b28388aaf5d231b39a287926a84e0e1ef52547 --- /dev/null +++ b/lens/pythia-160m-deduped-v0/params.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08f5da07bcfe2acce3088562897bab4ac871382c64b9a35eea9e4bfd1a5c075d +size 182895415 diff --git a/lens/pythia-1b-deduped-v0/config.json b/lens/pythia-1b-deduped-v0/config.json new file mode 100644 index 0000000000000000000000000000000000000000..912f3cade09357275f54f2ad51ebaf3f1c2d6275 --- /dev/null +++ b/lens/pythia-1b-deduped-v0/config.json @@ -0,0 +1 @@ +{"identity_init": true, "include_input": true, "rank": null, "shared_mlp_hidden_sizes": [], "sublayers": false, "num_layers": 16, "vocab_size": 50304, "bias": true, "d_model": 2048, "dropout": 0.0, "mlp_hidden_sizes": []} \ No newline at end of file diff --git a/lens/pythia-1b-deduped-v0/params.pt b/lens/pythia-1b-deduped-v0/params.pt new file mode 100644 index 0000000000000000000000000000000000000000..38df94e88625d5fd2567f9bab7be3df256349c88 --- /dev/null +++ b/lens/pythia-1b-deduped-v0/params.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c83f3fdb656c409e8cf2c5ecef1a4aba7d2bfd1f3fe4e0fa1b24602fc03279 +size 680682391 diff --git a/lens/pythia-410m-deduped-v0/config.json b/lens/pythia-410m-deduped-v0/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c143d288e9fc790a2538ed157d524b32b0d5ed53 --- /dev/null +++ b/lens/pythia-410m-deduped-v0/config.json @@ -0,0 +1 @@ +{"identity_init": true, "include_input": true, "rank": null, "shared_mlp_hidden_sizes": [], "sublayers": false, "num_layers": 24, "vocab_size": 50304, "bias": true, "d_model": 1024, "dropout": 0.0, "mlp_hidden_sizes": []} \ No newline at end of file diff --git a/lens/pythia-410m-deduped-v0/params.pt b/lens/pythia-410m-deduped-v0/params.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4ead4a244fe79b4c2d15134c9f771dc8872fa15 --- /dev/null +++ b/lens/pythia-410m-deduped-v0/params.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f93915ee38d64c003558d6b931e1c3ce964d70df53415d6695b489c2789fea84 +size 306828311 diff --git a/lens/pythia-6.9b-deduped-v0/config.json b/lens/pythia-6.9b-deduped-v0/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8b276d6cb3e465c6d43ed405523e6c3b7e052f3f --- /dev/null +++ b/lens/pythia-6.9b-deduped-v0/config.json @@ -0,0 +1 @@ +{"identity_init": true, "include_input": true, "rank": null, "shared_mlp_hidden_sizes": [], "sublayers": false, "num_layers": 32, "vocab_size": 50432, "bias": true, "d_model": 4096, "dropout": 0.0, "mlp_hidden_sizes": []} \ No newline at end of file diff --git a/lens/pythia-6.9b-deduped-v0/params.pt b/lens/pythia-6.9b-deduped-v0/params.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4c652b8a77ff3e347aa667aa8bd01b98e6f6ca5 --- /dev/null +++ b/lens/pythia-6.9b-deduped-v0/params.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79de8a9a4cc3fdfcf8283b5eaee157eb627ea2798b1e806469d9af45a4663e43 +size 2974336215 diff --git a/lens/pythia-70m-deduped-v0/config.json b/lens/pythia-70m-deduped-v0/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7ce8d1057deca17a44c1ee0a2ec721a47f840f17 --- /dev/null +++ b/lens/pythia-70m-deduped-v0/config.json @@ -0,0 +1 @@ +{"dropout": 0.0, "identity_init": true, "include_input": true, "mlp_hidden_sizes": [], "rank": null, "shared_mlp_hidden_sizes": [], "share_weights": false, "sublayers": false, "num_layers": 6, "vocab_size": 50304, "bias": true, "d_model": 512} \ No newline at end of file diff --git a/lens/pythia-70m-deduped-v0/params.pt b/lens/pythia-70m-deduped-v0/params.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c3acb09c4e6c567261c7bd1dfdc2f09cbc79bf5 --- /dev/null +++ b/lens/pythia-70m-deduped-v0/params.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc81f39274f8bb18da904101855903a3fbb885a21a27c5e4a66a90ce306f85d9 +size 109334503 diff --git a/requirements.txt b/requirements.txt index f8a583fdc0eb84bc4ddda4b09de05472d0ec79ef..94b94e6fccaba4602dd23495336c74ab5c8ba61e 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,2 +1 @@ -tuned_lens==0.1.0 -gradio \ No newline at end of file +tuned_lens==0.0.3