Upload 7 files
- hierarchos_config.json +71 -0
- merges.txt +0 -0
- model.pt +3 -0
- special_tokens_map.json +5 -0
- tokenizer.json +0 -0
- tokenizer_config.json +20 -0
- vocab.json +0 -0
hierarchos_config.json
ADDED
@@ -0,0 +1,71 @@
{
  "mode": "train",
  "train": true,
  "hf_dataset": "tatsu-lab/alpaca",
  "hf_dataset_config": null,
  "hf_dataset_split": "train",
  "text_column": null,
  "prompt_column": "instruction",
  "completion_column": "output",
  "model_path": null,
  "out_dir": "./rog_ally_model",
  "lora_adapter_path": null,
  "tokenizer_path": null,
  "resume_from_ckpt": null,
  "shadow_model_path": null,
  "pre_chunked_dataset": false,
  "pre_pt_dataset": false,
  "context_dim": 384,
  "persistent_dim": 128,
  "ltm_slots": 1024,
  "ltm_key_dim": 128,
  "ltm_val_dim": 128,
  "h_hidden": 384,
  "l_hidden": 384,
  "h_stride": 4,
  "max_h_steps": 3,
  "max_l_steps": 5,
  "l_conv_atol": 0.0001,
  "ltm_topk": 4,
  "max_length": 1512,
  "auto_max_length": true,
  "epochs": 30,
  "batch_size": 4,
  "accumulation_steps": 1,
  "starting_lr": 2e-06,
  "min_lr": 9e-08,
  "disable_lr_schedule": false,
  "ltm_lr": 0.01,
  "kayla": false,
  "lora_r": 8,
  "lora_alpha": 16,
  "finetune_unlock_percent": null,
  "quantize_on_complete": false,
  "grad_clip": 1.0,
  "ponder_loss_weight": 0.01,
  "commitment_loss_weight": 0.5,
  "commitment_threshold": 0.05,
  "override_scheduling": false,
  "num_workers": 0,
  "amp": false,
  "gradient_checkpointing": false,
  "compile": true,
  "force_compile": true,
  "debug_anomaly": false,
  "max_new_tokens": 512,
  "enable_quantized_learning": false,
  "ltm_lora_path": null,
  "device": "cpu",
  "h_halt_thresh": 0.9,
  "static_ltm_lr": false,
  "ltm_schedule_steps": 100,
  "ltm_schedule_min_lr": 1e-05,
  "qtype": "INT4",
  "threads": 8,
  "model_type": "hierarchos",
  "is_hf_dataset": true,
  "vocab_size": 50257,
  "completed_epoch": 60,
  "tokenizer_name": "openai-community/gpt2",
  "converted_from": "hierarchos_epoch_60.pt"
}
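For reference, the config can be read back with plain JSON tooling. A minimal Python sketch, standard library only; it assumes the file sits in the current directory and does not rely on any Hierarchos-specific loader API:

import json

# Sketch: read hierarchos_config.json and inspect a few of the fields shown above.
with open("hierarchos_config.json") as f:
    cfg = json.load(f)

print(cfg["model_type"])         # hierarchos
print(cfg["tokenizer_name"])     # openai-community/gpt2
print(cfg["context_dim"], cfg["ltm_slots"], cfg["completed_epoch"])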
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
model.pt
ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:dca9b63e9024f10eff273967acc3485497e41dc3ebd04bbe6c69adfe5cebaebc
size 100403096
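model.pt is stored as a Git LFS pointer, so the file above only records the object id and size. After fetching the real weights (e.g. with git lfs pull), the download can be checked against the sha256 oid. A minimal sketch, standard library only:

import hashlib

# Sketch: verify that the fetched model.pt matches the LFS pointer's sha256 oid.
EXPECTED_OID = "dca9b63e9024f10eff273967acc3485497e41dc3ebd04bbe6c69adfe5cebaebc"

h = hashlib.sha256()
with open("model.pt", "rb") as f:
    for chunk in iter(lambda: f.read(1 << 20), b""):
        h.update(chunk)

assert h.hexdigest() == EXPECTED_OID, "model.pt does not match the LFS pointer"
print("sha256 OK:", h.hexdigest())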
special_tokens_map.json
ADDED
@@ -0,0 +1,5 @@
{
  "bos_token": "<|endoftext|>",
  "eos_token": "<|endoftext|>",
  "unk_token": "<|endoftext|>"
}
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
tokenizer_config.json
ADDED
@@ -0,0 +1,20 @@
{
  "add_prefix_space": false,
  "added_tokens_decoder": {
    "50256": {
      "content": "<|endoftext|>",
      "lstrip": false,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    }
  },
  "bos_token": "<|endoftext|>",
  "clean_up_tokenization_spaces": false,
  "eos_token": "<|endoftext|>",
  "extra_special_tokens": {},
  "model_max_length": 1024,
  "tokenizer_class": "GPT2Tokenizer",
  "unk_token": "<|endoftext|>"
}
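Taken together, vocab.json, merges.txt, tokenizer.json and the two JSON files above make up a standard GPT-2 tokenizer, so they should load with Hugging Face transformers. A minimal sketch, assuming the repository has been cloned locally and "." points at its root:

from transformers import AutoTokenizer

# Sketch: load the GPT-2 tokenizer shipped in this repo (local path assumed).
tok = AutoTokenizer.from_pretrained(".")

print(type(tok).__name__)               # GPT2TokenizerFast or GPT2Tokenizer
print(tok.eos_token, tok.eos_token_id)  # <|endoftext|> 50256
ids = tok("hello world").input_ids
print(ids, "->", tok.decode(ids))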
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff