Upload 11 files
- config.json +46 -0
- data.json +76 -0
- generation_config.json +6 -0
- main.py +33 -0
- merges.txt +0 -0
- model.safetensors +3 -0
- special_tokens_map.json +6 -0
- tokenizer.json +0 -0
- tokenizer_config.json +21 -0
- train.py +47 -0
- vocab.json +0 -0
config.json
ADDED
@@ -0,0 +1,46 @@
{
  "_name_or_path": "distilgpt2",
  "_num_labels": 1,
  "activation_function": "gelu_new",
  "architectures": [
    "GPT2LMHeadModel"
  ],
  "attn_pdrop": 0.1,
  "bos_token_id": 50256,
  "embd_pdrop": 0.1,
  "eos_token_id": 50256,
  "id2label": {
    "0": "LABEL_0"
  },
  "initializer_range": 0.02,
  "label2id": {
    "LABEL_0": 0
  },
  "layer_norm_epsilon": 1e-05,
  "model_type": "gpt2",
  "n_ctx": 1024,
  "n_embd": 768,
  "n_head": 12,
  "n_inner": null,
  "n_layer": 6,
  "n_positions": 1024,
  "reorder_and_upcast_attn": false,
  "resid_pdrop": 0.1,
  "scale_attn_by_inverse_layer_idx": false,
  "scale_attn_weights": true,
  "summary_activation": null,
  "summary_first_dropout": 0.1,
  "summary_proj_to_labels": true,
  "summary_type": "cls_index",
  "summary_use_proj": true,
  "task_specific_params": {
    "text-generation": {
      "do_sample": true,
      "max_length": 50
    }
  },
  "torch_dtype": "float32",
  "transformers_version": "4.47.0",
  "use_cache": true,
  "vocab_size": 50257
}
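This is a stock distilgpt2 configuration (6 layers, 768-dim hidden states, the 50,257-token GPT-2 vocabulary). A minimal sketch of inspecting it, assuming the uploaded files sit in a local ./lockin_model directory (the path main.py below expects):

from transformers import AutoConfig

# Assumption: the files from this upload live locally in ./lockin_model.
config = AutoConfig.from_pretrained("./lockin_model")
print(config.model_type)  # "gpt2"
print(config.n_layer)     # 6 transformer blocks (distilgpt2)
print(config.n_embd)      # 768-dimensional hidden states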
data.json
ADDED
@@ -0,0 +1,76 @@
[
  {"input": "What are your thoughts on $lockin?", "output": "Does $lockin seem like a good investment?"},
  {"input": "Do you think $lockin will increase in value?", "output": "Is $lockin poised for a big price jump?"},
  {"input": "How is $lockin doing in the market right now?", "output": "Is $lockin outperforming other assets?"},
  {"input": "Should I buy more $lockin now?", "output": "Is now a good time to buy $lockin?"},
  {"input": "What’s the future outlook for $lockin?", "output": "Will $lockin rise in the coming months?"},
  {"input": "Is $lockin a safe investment?", "output": "Can $lockin be considered a safe bet?"},
  {"input": "Do you recommend holding onto $lockin?", "output": "Should I hold $lockin long term?"},
  {"input": "How does $lockin compare to other cryptocurrencies?", "output": "Is $lockin a better choice than other cryptocurrencies?"},
  {"input": "Can $lockin reach $100 in the next year?", "output": "Will $lockin reach $100 within a year?"},
  {"input": "What is the general market sentiment about $lockin?", "output": "Is the market positive about $lockin's future?"},
  {"input": "What is the potential of $lockin?", "output": "Does $lockin have strong potential for growth?"},
  {"input": "Is $lockin's price likely to increase this month?", "output": "Will $lockin’s price rise in the next 30 days?"},
  {"input": "Should I invest in $lockin now or wait?", "output": "Is it wise to invest in $lockin right now?"},
  {"input": "What is the current trend for $lockin?", "output": "Is $lockin currently in an uptrend?"},
  {"input": "What are experts saying about $lockin?", "output": "Do experts think $lockin will continue to grow?"},
  {"input": "Can $lockin become a top 10 cryptocurrency?", "output": "Is $lockin on track to become a top 10 cryptocurrency?"},
  {"input": "How does $lockin perform in a bear market?", "output": "Does $lockin hold up well in a bear market?"},
  {"input": "Is $lockin a risky investment?", "output": "Is $lockin considered a high-risk investment?"},
  {"input": "What’s the best way to acquire $lockin?", "output": "Is buying $lockin through exchanges the best option?"},
  {"input": "Does $lockin have any partnerships or collaborations?", "output": "Has $lockin formed any significant partnerships?"},
  {"input": "What are the latest developments with $lockin?", "output": "Is $lockin involved in any recent significant developments?"},
  {"input": "How has $lockin’s performance been this year?", "output": "Is $lockin performing well this year?"},
  {"input": "What are the advantages of investing in $lockin?", "output": "Does $lockin have a strong competitive advantage?"},
  {"input": "Is $lockin’s tokenomics solid?", "output": "Can $lockin’s tokenomics support long-term growth?"},
  {"input": "Should I diversify my portfolio with $lockin?", "output": "Is $lockin a good addition to a diversified portfolio?"},
  {"input": "What are the risks of holding $lockin?", "output": "Is there significant risk in holding $lockin?"},
  {"input": "Is $lockin’s community growing?", "output": "Is $lockin’s community gaining traction?"},
  {"input": "Should I stake $lockin for passive income?", "output": "Is staking $lockin a good way to earn passive income?"},
  {"input": "What’s the market capitalization of $lockin?", "output": "Is $lockin’s market cap increasing?"},
  {"input": "How long do you think $lockin will last?", "output": "Is $lockin expected to have long-term staying power?"},
  {"input": "Is $lockin experiencing high volatility?", "output": "Is $lockin’s price highly volatile?"},
  {"input": "Will $lockin be used for everyday transactions in the future?", "output": "Can $lockin become a mainstream currency?"},
  {"input": "Is $lockin a deflationary token?", "output": "Does $lockin have a deflationary supply model?"},
  {"input": "What’s the role of $lockin in decentralized finance?", "output": "Is $lockin widely used in DeFi protocols?"},
  {"input": "What are the unique features of $lockin?", "output": "Does $lockin have any unique selling points?"},
  {"input": "Should I trade $lockin on multiple exchanges?", "output": "Is it worth trading $lockin on different platforms?"},
  {"input": "How secure is the $lockin network?", "output": "Is the $lockin blockchain highly secure?"},
  {"input": "Can $lockin be used in smart contracts?", "output": "Is $lockin supported by smart contracts?"},
  {"input": "How easy is it to buy $lockin?", "output": "Is purchasing $lockin straightforward?"},
  {"input": "Will $lockin’s price recover after a dip?", "output": "Is $lockin likely to recover after a price dip?"},
  {"input": "How does $lockin handle scalability?", "output": "Is $lockin capable of scaling effectively?"},
  {"input": "How does $lockin’s technology compare to others?", "output": "Is $lockin’s technology superior to its competitors?"},
  {"input": "Should I sell my $lockin holdings now?", "output": "Is now a good time to sell $lockin?"},
  {"input": "Is $lockin gaining adoption in the market?", "output": "Is $lockin becoming more widely adopted?"},
  {"input": "Can $lockin achieve a market cap of $1 billion?", "output": "Is $lockin on track to reach a $1 billion market cap?"},
  {"input": "How decentralized is $lockin?", "output": "Is $lockin fully decentralized?"},
  {"input": "Will $lockin surpass Bitcoin in value?", "output": "Can $lockin overtake Bitcoin in the future?"},
  {"input": "How well does $lockin perform during bull markets?", "output": "Does $lockin perform well in bull markets?"},
  {"input": "Is $lockin a good hedge against inflation?", "output": "Can $lockin protect against inflationary risks?"},
  {"input": "What are the staking rewards for $lockin?", "output": "Are staking rewards for $lockin attractive?"},
  {"input": "Is $lockin a good asset for day trading?", "output": "Can $lockin be profitably day-traded?"},
  {"input": "Should I consider using $lockin for yield farming?", "output": "Is $lockin a good option for yield farming?"},
  {"input": "How does $lockin compare to Ethereum in terms of scalability?", "output": "Is $lockin more scalable than Ethereum?"},
  {"input": "Can $lockin be used as collateral in DeFi?", "output": "Is $lockin accepted as collateral in decentralized finance?"},
  {"input": "Will $lockin be listed on more exchanges?", "output": "Is $lockin likely to be listed on additional exchanges?"},
  {"input": "How does $lockin maintain its value?", "output": "Is $lockin's value supported by strong fundamentals?"},
  {"input": "Is $lockin a stablecoin?", "output": "Is $lockin designed to be a stablecoin?"},
  {"input": "Can $lockin be used in gaming applications?", "output": "Is $lockin useful in the gaming industry?"},
  {"input": "What’s the adoption rate of $lockin in fintech?", "output": "Is $lockin gaining traction in the fintech industry?"},
  {"input": "Is $lockin backed by any assets?", "output": "Is $lockin backed by real-world assets?"},
  {"input": "Should I stake my $lockin for long-term gains?", "output": "Is staking $lockin for the long term a good strategy?"},
  {"input": "Does $lockin have a governance token?", "output": "Is there a governance token for $lockin?"},
  {"input": "What is $lockin’s token supply model?", "output": "Does $lockin have a deflationary token supply model?"},
  {"input": "Is $lockin integrated with DeFi protocols?", "output": "Can $lockin be used in popular DeFi protocols?"},
  {"input": "What are the chances of $lockin succeeding in the long term?", "output": "Does $lockin have long-term potential?"},
  {"input": "Is $lockin a community-driven project?", "output": "Is $lockin driven by a strong community?"},
  {"input": "Should I consider $lockin for my retirement fund?", "output": "Is $lockin a good investment for long-term savings?"},
  {"input": "Does $lockin have any partnerships with big companies?", "output": "Has $lockin formed any major partnerships?"},
  {"input": "How much has $lockin appreciated in value this year?", "output": "Has $lockin seen a significant increase in value this year?"},
  {"input": "Can $lockin’s technology disrupt traditional finance?", "output": "Does $lockin have the potential to disrupt traditional finance?"},
  {"input": "Will $lockin become a mainstream currency?", "output": "Is $lockin on track to become widely accepted?"},
  {"input": "What’s the risk/reward ratio for investing in $lockin?", "output": "Is the risk/reward ratio for $lockin favorable?"},
  {"input": "Is $lockin a viable alternative to Bitcoin?", "output": "Can $lockin replace Bitcoin as a store of value?"}
]
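The dataset is 73 input/output pairs that rephrase free-form $lockin questions into yes/no form. A quick sanity check before training, sketched under the assumption that data.json sits in the working directory:

import json

# Load the training pairs and confirm every record has both expected keys.
with open("data.json") as f:
    pairs = json.load(f)

assert all({"input", "output"} <= set(p) for p in pairs)
print(len(pairs))  # 73 pairs in this upload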
generation_config.json
ADDED
@@ -0,0 +1,6 @@
{
  "_from_model_config": true,
  "bos_token_id": 50256,
  "eos_token_id": 50256,
  "transformers_version": "4.47.0"
}
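These defaults were derived from the model config ("_from_model_config": true). A sketch of loading them explicitly, again assuming the same local directory:

from transformers import GenerationConfig

# Assumption: ./lockin_model is a local copy of this repo.
gen_config = GenerationConfig.from_pretrained("./lockin_model")
print(gen_config.bos_token_id, gen_config.eos_token_id)  # 50256 50256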
main.py
ADDED
@@ -0,0 +1,33 @@
from transformers import AutoTokenizer, AutoModelForCausalLM

# Load your fine-tuned model and tokenizer
tokenizer = AutoTokenizer.from_pretrained("./lockin_model")
model = AutoModelForCausalLM.from_pretrained("./lockin_model")

# Function to generate yes/no questions
def generate_question(input_text):
    # Add padding and attention mask
    inputs = tokenizer(
        input_text,
        return_tensors="pt",
        padding=True,
        truncation=True,
        return_attention_mask=True
    )

    output = model.generate(
        inputs["input_ids"],
        attention_mask=inputs["attention_mask"],  # Add attention mask
        max_new_tokens=100,
        do_sample=True,
        temperature=1.5,
        top_p=0.8,
        top_k=50,
        pad_token_id=tokenizer.eos_token_id  # Explicitly set pad token ID
    )
    return tokenizer.decode(output[0], skip_special_tokens=True)

# Example usage
prompt = "What the fuck"
question = generate_question(prompt)
print("Generated Question:", question)
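With do_sample=True and temperature=1.5, each call is nondeterministic. A small sketch of pinning the RNG for repeatable output, reusing generate_question from above:

from transformers import set_seed

set_seed(42)  # seeds python, numpy, and torch so sampled generations repeat
print(generate_question("Is $lockin trending?"))  # hypothetical prompt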
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
model.safetensors
ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:28828ab346afb345a6049fdbb9ec31e8595edd1d5ac2182d6cf4b8a264f69181
size 327657928
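This is a Git LFS pointer, not the weights themselves; the ~328 MB safetensors file is fetched on checkout. A sketch of verifying a downloaded copy against the pointer's digest:

import hashlib

# Hash the downloaded weights in 1 MiB chunks and compare to the LFS pointer.
h = hashlib.sha256()
with open("model.safetensors", "rb") as f:
    for chunk in iter(lambda: f.read(1 << 20), b""):
        h.update(chunk)
print(h.hexdigest() == "28828ab346afb345a6049fdbb9ec31e8595edd1d5ac2182d6cf4b8a264f69181")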
special_tokens_map.json
ADDED
@@ -0,0 +1,6 @@
{
  "bos_token": "<|endoftext|>",
  "eos_token": "<|endoftext|>",
  "pad_token": "<|endoftext|>",
  "unk_token": "<|endoftext|>"
}
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
tokenizer_config.json
ADDED
@@ -0,0 +1,21 @@
{
  "add_prefix_space": false,
  "added_tokens_decoder": {
    "50256": {
      "content": "<|endoftext|>",
      "lstrip": false,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    }
  },
  "bos_token": "<|endoftext|>",
  "clean_up_tokenization_spaces": false,
  "eos_token": "<|endoftext|>",
  "extra_special_tokens": {},
  "model_max_length": 1024,
  "pad_token": "<|endoftext|>",
  "tokenizer_class": "GPT2Tokenizer",
  "unk_token": "<|endoftext|>"
}
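Per GPT-2 convention, <|endoftext|> (id 50256) serves as bos, eos, pad, and unk at once, matching special_tokens_map.json above. A sketch confirming the setup, assuming the local ./lockin_model path:

from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("./lockin_model")  # assumed local path
assert tok.bos_token == tok.eos_token == tok.pad_token == tok.unk_token == "<|endoftext|>"
print(tok.eos_token_id)  # 50256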
train.py
ADDED
@@ -0,0 +1,47 @@
from transformers import Trainer, TrainingArguments, AutoModelForCausalLM, AutoTokenizer
from datasets import load_dataset

# Load a small pre-trained model and tokenizer
model_name = "distilgpt2"  # or choose another small model
model = AutoModelForCausalLM.from_pretrained(model_name)
tokenizer = AutoTokenizer.from_pretrained(model_name)

# Add a pad token (setting it to eos_token is one common approach for GPT-based models)
tokenizer.pad_token = tokenizer.eos_token  # Or you can choose to add a new pad token, e.g., '[PAD]'

# Load the dataset (Make sure data.json is in the correct location)
train_data = load_dataset("json", data_files={"train": "data.json"})

# Preprocess the dataset
def preprocess_function(examples):
    inputs = examples["input"]
    outputs = examples["output"]
    model_inputs = tokenizer(inputs, max_length=512, truncation=True, padding="max_length")
    labels = tokenizer(outputs, max_length=512, truncation=True, padding="max_length")
    model_inputs["labels"] = labels["input_ids"]
    return model_inputs

# Preprocess the train dataset using the map function
train_dataset = train_data["train"].map(preprocess_function, batched=True)

# Define training arguments
training_args = TrainingArguments(
    output_dir="./results",
    num_train_epochs=3,
    per_device_train_batch_size=4,
    logging_dir="./logs",
)

# Initialize Trainer
trainer = Trainer(
    model=model,
    args=training_args,
    train_dataset=train_dataset,
)

# Train the model
trainer.train()

# Save the fine-tuned model
model.save_pretrained("./lockin_model")
tokenizer.save_pretrained("./lockin_model")
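One caveat in preprocess_function above: labels are padded with the eos token and never masked, so the loss is also computed over padding. The usual convention is to set padded label positions to -100, which Trainer's cross-entropy loss ignores. A hedged sketch of that variant:

# Variant of preprocess_function that masks padding out of the loss.
def preprocess_function(examples):
    model_inputs = tokenizer(examples["input"], max_length=512,
                             truncation=True, padding="max_length")
    labels = tokenizer(examples["output"], max_length=512,
                       truncation=True, padding="max_length")
    # attention_mask is 1 for real tokens, 0 for padding; -100 is ignored by the loss.
    model_inputs["labels"] = [
        [tok if mask == 1 else -100 for tok, mask in zip(seq, attn)]
        for seq, attn in zip(labels["input_ids"], labels["attention_mask"])
    ]
    return model_inputs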
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff