diff --git a/docs/prompt.txt b/docs/prompt.txt
deleted file mode 100644
index 3644be4a4..000000000
--- a/docs/prompt.txt
+++ /dev/null
@@ -1,93 +0,0 @@
-Create multi-page long and explicit professional pytorch-like documentation for the swarms code below follow the outline for the swarms library, provide many examples and teach the user about the code, provide examples for every function, make the documentation 10,000 words, provide many usage examples and note this is markdown docs, create the documentation for the code to document.
-
-Now make the professional documentation for this code, provide the architecture and how the class works and why it works that way, it's purpose, provide args, their types, 3 ways of usage examples, in examples use from shapeless import x
-
-BE VERY EXPLICIT AND THOROUGH, MAKE IT DEEP AND USEFUL
-
-########
-Step 1: Understand the purpose and functionality of the module or framework
-
-Read and analyze the description provided in the documentation to understand the purpose and functionality of the module or framework.
-Identify the key features, parameters, and operations performed by the module or framework.
-Step 2: Provide an overview and introduction
-
-Start the documentation by providing a brief overview and introduction to the module or framework.
-Explain the importance and relevance of the module or framework in the context of the problem it solves.
-Highlight any key concepts or terminology that will be used throughout the documentation.
-Step 3: Provide a class or function definition
-
-Provide the class or function definition for the module or framework.
-Include the parameters that need to be passed to the class or function and provide a brief description of each parameter.
-Specify the data types and default values for each parameter.
-Step 4: Explain the functionality and usage
-
-Provide a detailed explanation of how the module or framework works and what it does.
-Describe the steps involved in using the module or framework, including any specific requirements or considerations.
-Provide code examples to demonstrate the usage of the module or framework.
-Explain the expected inputs and outputs for each operation or function.
-Step 5: Provide additional information and tips
-
-Provide any additional information or tips that may be useful for using the module or framework effectively.
-Address any common issues or challenges that developers may encounter and provide recommendations or workarounds.
-Step 6: Include references and resources
-
-Include references to any external resources or research papers that provide further information or background on the module or framework.
-Provide links to relevant documentation or websites for further exploration.
-Example Template for the given documentation:
-
-# Module/Function Name: MultiheadAttention
-
-class torch.nn.MultiheadAttention(embed_dim, num_heads, dropout=0.0, bias=True, add_bias_kv=False, add_zero_attn=False, kdim=None, vdim=None, batch_first=False, device=None, dtype=None):
-    """
-    Creates a multi-head attention module for joint information representation from the different subspaces.
-
-    Parameters:
-    - embed_dim (int): Total dimension of the model.
-    - num_heads (int): Number of parallel attention heads. The embed_dim will be split across num_heads.
-    - dropout (float): Dropout probability on attn_output_weights. Default: 0.0 (no dropout).
-    - bias (bool): If specified, adds bias to input/output projection layers. Default: True.
-    - add_bias_kv (bool): If specified, adds bias to the key and value sequences at dim=0. Default: False.
-    - add_zero_attn (bool): If specified, adds a new batch of zeros to the key and value sequences at dim=1. Default: False.
-    - kdim (int): Total number of features for keys. Default: None (uses kdim=embed_dim).
-    - vdim (int): Total number of features for values. Default: None (uses vdim=embed_dim).
-    - batch_first (bool): If True, the input and output tensors are provided as (batch, seq, feature). Default: False.
-    - device (torch.device): If specified, the tensors will be moved to the specified device.
-    - dtype (torch.dtype): If specified, the tensors will have the specified dtype.
-    """
-
-    def forward(query, key, value, key_padding_mask=None, need_weights=True, attn_mask=None, average_attn_weights=True, is_causal=False):
-        """
-        Forward pass of the multi-head attention module.
-
-        Parameters:
-        - query (Tensor): Query embeddings of shape (L, E_q) for unbatched input, (L, N, E_q) when batch_first=False, or (N, L, E_q) when batch_first=True.
-        - key (Tensor): Key embeddings of shape (S, E_k) for unbatched input, (S, N, E_k) when batch_first=False, or (N, S, E_k) when batch_first=True.
-        - value (Tensor): Value embeddings of shape (S, E_v) for unbatched input, (S, N, E_v) when batch_first=False, or (N, S, E_v) when batch_first=True.
-        - key_padding_mask (Optional[Tensor]): If specified, a mask indicating elements to be ignored in key for attention computation.
-        - need_weights (bool): If specified, returns attention weights in addition to attention outputs. Default: True.
-        - attn_mask (Optional[Tensor]): If specified, a mask preventing attention to certain positions.
-        - average_attn_weights (bool): If true, returns averaged attention weights per head. Otherwise, returns attention weights separately per head. Note that this flag only has an effect when need_weights=True. Default: True.
-        - is_causal (bool): If specified, applies a causal mask as the attention mask. Default: False.
-
-        Returns:
-        Tuple[Tensor, Optional[Tensor]]:
-        - attn_output (Tensor): Attention outputs of shape (L, E) for unbatched input, (L, N, E) when batch_first=False, or (N, L, E) when batch_first=True.
-        - attn_output_weights (Optional[Tensor]): Attention weights of shape (L, S) when unbatched or (N, L, S) when batched. Optional, only returned when need_weights=True.
-        """
-
-        # Implementation of the forward pass of the attention module goes here
-
-        return attn_output, attn_output_weights
-
-
-# Usage example:
-
-multihead_attn = nn.MultiheadAttention(embed_dim, num_heads)
-attn_output, attn_output_weights = multihead_attn(query, key, value)
-Note:
-
-The above template includes the class or function definition, parameters, description, and usage example.
-To replicate the documentation for any other module or framework, follow the same structure and provide the specific details for that module or framework.
-
-
-############# CODE TO DOCUMENT, DOCUMENT THE
diff --git a/docs/swarms/models/anthropic.md b/docs/swarms/models/anthropic.md
index 4d5f1fcd9..cf139f761 100644
--- a/docs/swarms/models/anthropic.md
+++ b/docs/swarms/models/anthropic.md
@@ -70,17 +70,18 @@ class Anthropic:
 ```python
 # Import necessary modules and classes
 from swarms.models import Anthropic
-import torch
 
 # Initialize an instance of the Anthropic class
-anthropic_instance = Anthropic()
+model = Anthropic(
+    anthropic_api_key="sk-"
+)
 
-# Using the generate method
-completion_1 = anthropic_instance.generate("What is the capital of France?")
+# Using the run method
+completion_1 = model.run("What is the capital of France?")
 print(completion_1)
 
 # Using the __call__ method
-completion_2 = anthropic_instance("How far is the moon from the earth?", stop=["miles", "km"])
+completion_2 = model("How far is the moon from the earth?", stop=["miles", "km"])
 print(completion_2)
 ```
diff --git a/godmode.py b/godmode.py
deleted file mode 100644
index f1269d980..000000000
--- a/godmode.py
+++ /dev/null
@@ -1,16 +0,0 @@
-from swarms.swarms import GodMode
-from swarms.models import OpenAIChat
-
-api_key = ""
-
-llm = OpenAIChat(openai_api_key=api_key)
-
-
-llms = [llm, llm, llm]
-
-god_mode = GodMode(llms)
-
-task = "Generate a 10,000 word blog on health and wellness."
-
-out = god_mode.run(task)
-god_mode.print_responses(task)
diff --git a/dalle3.py b/playground/models/dalle3.py
similarity index 100%
rename from dalle3.py
rename to playground/models/dalle3.py
diff --git a/gpt4vision_example.py b/playground/models/gpt4vision_example.py
similarity index 100%
rename from gpt4vision_example.py
rename to playground/models/gpt4vision_example.py
diff --git a/swarms/agents/idea_to_image_agent.py b/swarms/agents/idea_to_image_agent.py
index e2a06691b..f7e5ec0c8 100644
--- a/swarms/agents/idea_to_image_agent.py
+++ b/swarms/agents/idea_to_image_agent.py
@@ -1,7 +1,7 @@
 import os
 import logging
 from dataclasses import dataclass
-from dalle3 import Dalle
+from playground.models.dalle3 import Dalle
 from swarms.models import OpenAIChat
 
 
diff --git a/swarms/models/huggingface.py b/swarms/models/huggingface.py
index d18b1b9d6..0c5bf2c7a 100644
--- a/swarms/models/huggingface.py
+++ b/swarms/models/huggingface.py
@@ -23,7 +23,7 @@ class HuggingfaceLLM:
     ```
     from swarms.models import HuggingfaceLLM
 
-    model_id = "gpt2-small"
+    model_id = "NousResearch/Yarn-Mistral-7b-128k"
     inference = HuggingfaceLLM(model_id=model_id)
 
     task = "Once upon a time"
@@ -74,15 +74,20 @@ def __init__(
         bnb_config = BitsAndBytesConfig(**quantization_config)
 
         try:
-            self.tokenizer = AutoTokenizer.from_pretrained(self.model_id)
+            self.tokenizer = AutoTokenizer.from_pretrained(self.model_id, *args, **kwargs)
             self.model = AutoModelForCausalLM.from_pretrained(
-                self.model_id, quantization_config=bnb_config
+                self.model_id, quantization_config=bnb_config, *args, **kwargs
             )
             self.model  # .to(self.device)
         except Exception as e:
-            self.logger.error(f"Failed to load the model or the tokenizer: {e}")
-            raise
+            # self.logger.error(f"Failed to load the model or the tokenizer: {e}")
+            # raise
+            print(colored(f"Failed to load the model and or the tokenizer: {e}", "red"))
+
+    def print_error(self, error: str):
+        """Print error"""
+        print(colored(f"Error: {error}", "red"))
 
     def load_model(self):
         """Load the model"""
@@ -157,7 +162,7 @@ def run(self, task: str):
             del inputs
             return self.tokenizer.decode(outputs[0], skip_special_tokens=True)
         except Exception as e:
-            self.logger.error(f"Failed to generate the text: {e}")
+            print(colored(f"HuggingfaceLLM could not generate text because of error: {e}, try optimizing your arguments", "red"))
             raise
 
     async def run_async(self, task: str, *args, **kwargs) -> str:
diff --git a/tests/models/dalle3.py b/tests/models/dalle3.py
index ff1489ea3..42b851b79 100644
--- a/tests/models/dalle3.py
+++ b/tests/models/dalle3.py
@@ -6,7 +6,7 @@
 from PIL import Image
 from termcolor import colored
 
-from dalle3 import Dalle3
+from playground.models.dalle3 import Dalle3
 
 # Mocking the OpenAI client to avoid making actual API calls during testing