From 661f8a312cb031e1333491c366d051672fb1d814 Mon Sep 17 00:00:00 2001
From: Haofei Yu <1125027232@qq.com>
Date: Tue, 7 Nov 2023 23:07:04 -0500
Subject: [PATCH] support gpt-4-turbo change and add db doc and convert to
 json

---
 llm_generate/README.md                        |   9 +-
 llm_generate/generate.py                      | 739 ++++++++++++++++++
 llm_generate/requirments.txt                  |   3 +-
 llm_generate/step1.sh                         |   1 +
 llm_generate/step1_generate_env_profile.py    |  37 +-
 llm_generate/step2.sh                         |   4 +
 ...step2_push_agent_relationship_env_to_db.py |   4 +-
 llm_generate/step3_convert_db_into_json.py    |  31 +
 .../step4_convert_json_to_gen_input.py        |  18 +
 9 files changed, 821 insertions(+), 25 deletions(-)
 create mode 100644 llm_generate/generate.py
 create mode 100644 llm_generate/step1.sh
 create mode 100644 llm_generate/step2.sh
 create mode 100644 llm_generate/step3_convert_db_into_json.py
 create mode 100644 llm_generate/step4_convert_json_to_gen_input.py

diff --git a/llm_generate/README.md b/llm_generate/README.md
index 869e5537..f52cb499 100644
--- a/llm_generate/README.md
+++ b/llm_generate/README.md
@@ -6,4 +6,11 @@ For the second step, we put the original agentProfile and relationshipProfile in
 
 For the third step, we combine them together to be combos based on conditional sampling (the restriction is the relationship)
 
-All the EnvProfile (new generated), AgentProfile (sotopia original), RelationshipProfile (sotopia original), and envagentcombo are on the redis database that is new created.
\ No newline at end of file
+All the EnvProfile (newly generated), AgentProfile (sotopia original), RelationshipProfile (sotopia original), and envagentcombo records are stored in the newly created Redis database.
+
+# Local Redis Setting
+Since redis-server cannot ingest JSON data directly, the RedisJSON module must be loaded into the server to enable this functionality. Therefore, we run a Docker image that ships with RedisJSON preloaded:
+
+docker run -p 6379:6379 --name redis-stack redis/redis-stack:latest
+
+Link:
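+
+As a quick sanity check that the RedisJSON module is actually loaded (a minimal sketch, assuming the redis-py client v4+ is installed; the rejson package used in step 3 works as well):
+
+```python
+import redis
+
+# Connect to the redis-stack container started above.
+r = redis.Redis(host="localhost", port=6379, decode_responses=True)
+
+# If RedisJSON is loaded, JSON.SET / JSON.GET should succeed:
+r.json().set("sanity:check", "$", {"hello": "world"})
+print(r.json().get("sanity:check"))  # -> {'hello': 'world'}
+```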
diff --git a/llm_generate/generate.py b/llm_generate/generate.py
new file mode 100644
index 00000000..6b0614b6
--- /dev/null
+++ b/llm_generate/generate.py
@@ -0,0 +1,739 @@
+import logging
+import re
+from typing import TypeVar, cast
+
+import gin
+from beartype import beartype
+from beartype.typing import Type
+from langchain.callbacks import StdOutCallbackHandler
+from langchain.chains import LLMChain
+from langchain.chat_models import ChatOpenAI
+from langchain.llms import OpenAI
+from langchain.output_parsers import PydanticOutputParser
+from langchain.prompts import (
+    ChatPromptTemplate,
+    HumanMessagePromptTemplate,
+    PromptTemplate,
+)
+from langchain.schema import (
+    BaseOutputParser,
+    HumanMessage,
+    OutputParserException,
+)
+from pydantic import BaseModel, Field, validator
+from rich import print
+from rich.logging import RichHandler
+from typing_extensions import Literal
+
+from sotopia.database import EnvironmentProfile, RelationshipProfile
+from sotopia.messages import (
+    ActionType,
+    AgentAction,
+    ScriptBackground,
+    ScriptEnvironmentResponse,
+)
+from sotopia.utils import format_docstring
+
+from sotopia.generation_utils.langchain_callback_handler import LoggingCallbackHandler
+from sotopia.generation_utils.llama2 import Llama2
+
+log = logging.getLogger("generate")
+logging_handler = LoggingCallbackHandler("langchain")
+
+LLM_Name = Literal[
+    "togethercomputer/llama-2-7b-chat",
+    "togethercomputer/llama-2-70b-chat",
+    "togethercomputer/mpt-30b-chat",
+    "gpt-3.5-turbo",
+    "text-davinci-003",
+    "gpt-4",
+    "gpt-4-turbo",
+    "human",
+    "redis",
+]
+
+OutputType = TypeVar("OutputType", bound=object)
+
+
+class EnvResponse(BaseModel):
+    reasoning: str = Field(
+        description="first reiterate agents' social goals and then reason about what agents say/do and whether that aligns with their goals."
+    )
+    p1_rate: int = Field(
+        description="rating of participant 1, on the scale of 0 to 9"
+    )
+    p2_rate: int = Field(
+        description="rating of participant 2, on the scale of 0 to 9"
+    )
+
+
+class EnvResponsePydanticOutputParser(PydanticOutputParser[EnvResponse]):
+    def __init__(self, pydantic_object: Type[BaseModel] = EnvResponse) -> None:
+        super(EnvResponsePydanticOutputParser, self).__init__(
+            pydantic_object=pydantic_object
+        )
+
+    def parse(self, text: str) -> EnvResponse:
+        # remove trailing commas before ) or ] from text
+        text = re.sub(r",\s*(\)|\])", r"\1", text)
+        return super().parse(text)
+
+    def get_format_instructions(self) -> str:
+        format_instruction = super().get_format_instructions()
+        return format_instruction
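+
+# For reference, a well-formed EnvResponse reply looks like (illustrative values):
+# {"reasoning": "Agent 1 first restated the goal ...", "p1_rate": 7, "p2_rate": 5}
+# parse() above also tolerates near-miss JSON with trailing commas before ) or ].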
+
+
+class ListOfIntOutputParser(BaseOutputParser[list[int]]):
+    number_of_int: int | None
+    range_of_int: tuple[int, int] | None
+
+    def __init__(
+        self,
+        number_of_int: int | None = None,
+        range_of_int: tuple[int, int] | None = None,
+    ):
+        """
+        Parse the output to a list of integers
+
+        Args:
+            number_of_int (int | None): The number of integers in the output. If None, the number of integers is not fixed.
+            range_of_int (tuple[int, int] | None): The inclusive (min, max) range the integers must fall in. If None, the range is not restricted.
+        """
+        super().__init__()
+        self.number_of_int = number_of_int
+        self.range_of_int = range_of_int
+
+    def _get_description_text(self) -> str:
+        return f"a list of{' ' + str(self.number_of_int) if self.number_of_int else ''} integers{' within the range of' + str(self.range_of_int) if self.range_of_int else ''} separated by space"
+
+    def get_format_instructions(self) -> str:
+        return "Please output " + self._get_description_text()
+
+    def parse(self, output: str) -> list[int]:
+        try:
+            if ":" in output:
+                output = output.split(":")[1]
+            result = [int(x) for x in output.split(" ") if x]
+            if self.number_of_int and len(result) != self.number_of_int:
+                msg = (
+                    f"Expect {self.number_of_int} integers, got {len(result)}"
+                )
+                raise OutputParserException(msg)
+            if self.range_of_int:
+                for x in result:
+                    if x < self.range_of_int[0] or x > self.range_of_int[1]:
+                        msg = f"Expect integers within the range of {self.range_of_int}, got {result}"
+                        raise OutputParserException(msg)
+            return result
+        except KeyboardInterrupt:
+            raise KeyboardInterrupt
+        except Exception as e:
+            msg = f"Exception {e}: the output format is not correct. Expect {self._get_description_text()}, got {output}"
+            raise OutputParserException(msg)
+
+    @property
+    def _type(self) -> str:
+        """Return the type key."""
+        return "list[int]"
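+
+# Illustrative usage sketch (not exercised anywhere in this file):
+# parser = ListOfIntOutputParser(number_of_int=2, range_of_int=(0, 9))
+# parser.parse("Ratings: 7 8")  # -> [7, 8]; anything before a ":" is dropped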
+
+
+class ListOfStrOutputParser(BaseOutputParser[list[str]]):
+    number_of_str: int | None
+
+    def __init__(
+        self,
+        number_of_str: int | None = None,
+    ):
+        """
+        Parse the output to a list of strings
+
+        Args:
+            number_of_str (int | None): The number of strings in the output. If None, the number of strings is not fixed.
+        """
+        super().__init__()
+        self.number_of_str = number_of_str
+
+    def _get_description_text(self) -> str:
+        return f"a list of{' ' + str(self.number_of_str) if self.number_of_str else ''} strings separated by space"
+
+    def get_format_instructions(self) -> str:
+        return "Please output " + self._get_description_text()
+
+    def parse(self, output: str) -> list[str]:
+        try:
+            result = output.split(" ")
+            if self.number_of_str and len(result) != self.number_of_str:
+                msg = f"Expect {self.number_of_str} strings, got {len(result)}"
+                raise OutputParserException(msg)
+            return result
+        except KeyboardInterrupt:
+            raise KeyboardInterrupt
+        except Exception as e:
+            msg = f"Exception {e}: the output format is not correct. Expect {self._get_description_text()}, got {output}"
+            raise OutputParserException(msg)
+
+    @property
+    def _type(self) -> str:
+        """Return the type key."""
+        return "list[str]"
+
+
+class StrOutputParser(BaseOutputParser[str]):
+    def __init__(self) -> None:
+        super().__init__()
+
+    def get_format_instructions(self) -> str:
+        return "Please output a string"
+
+    def parse(self, output: str) -> str:
+        return output
+
+    @property
+    def _type(self) -> str:
+        """Return the type key."""
+        return "str"
+
+
+def _return_fixed_model_version(
+    model_name: Literal["gpt-3.5-turbo", "gpt-4", "gpt-4-turbo"]
+) -> str:
+    return {
+        "gpt-3.5-turbo": "gpt-3.5-turbo-0613",
+        "gpt-4": "gpt-4-0613",
+        "gpt-4-turbo": "gpt-4-1106-preview",
+    }[model_name]
+
+
+@gin.configurable
+@beartype
+def obtain_chain(
+    model_name: LLM_Name,
+    template: str,
+    input_variables: list[str],
+    temperature: float = 0.7,
+    max_retries: int = 6,
+) -> LLMChain:
+    """
+    Using langchain to sample profiles for participants
+    """
+    match model_name:
+        case "gpt-3.5-turbo" | "gpt-4" | "gpt-4-turbo":
+            human_message_prompt = HumanMessagePromptTemplate(
+                prompt=PromptTemplate(
+                    template=template,
+                    input_variables=input_variables,
+                )
+            )
+            chat_prompt_template = ChatPromptTemplate.from_messages(
+                [human_message_prompt]
+            )
+            chat = ChatOpenAI(
+                model_name=_return_fixed_model_version(model_name),
+                temperature=temperature,
+                max_retries=max_retries,
+            )
+            chain = LLMChain(llm=chat, prompt=chat_prompt_template)
+            return chain
+        case "text-davinci-003":
+            # Warning: no interactive mode for 003
+            llm = OpenAI(
+                model_name=model_name,
+                temperature=temperature,
+                max_retries=max_retries,
+            )
+            prompt = PromptTemplate(
+                input_variables=input_variables,
+                template=template,
+            )
+            chain = LLMChain(llm=llm, prompt=prompt)
+            return chain
+        case "togethercomputer/llama-2-7b-chat" | "togethercomputer/llama-2-70b-chat":
+            human_message_prompt = HumanMessagePromptTemplate(
+                prompt=PromptTemplate(
+                    template=template,
+                    input_variables=input_variables,
+                )
+            )
+            chat_prompt_template = ChatPromptTemplate.from_messages(
+                [human_message_prompt]
+            )
+            together_llm = Llama2(
+                model_name=model_name, temperature=temperature
+            )
+            chain = LLMChain(llm=together_llm, prompt=chat_prompt_template)
+            return chain
+        case _:
+            raise ValueError(f"Invalid model name: {model_name}")
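+
+# Illustrative usage sketch (assumes OPENAI_API_KEY is set; the names are made up):
+# chain = obtain_chain(
+#     model_name="gpt-4-turbo",
+#     template="Say hi to {name}.",
+#     input_variables=["name"],
+# )
+# greeting = chain.predict(name="Sotopia")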
+
+
+@beartype
+def format_bad_output(
+    ill_formed_output: str,
+    format_instructions: str,
+    model_name: LLM_Name = "gpt-3.5-turbo",
+) -> str:
+    template = """
+    Given the string that cannot be parsed by the JSON parser, reformat it to a string that can be parsed by the JSON parser.
+    Original string: {ill_formed_output}
+
+    Format instructions: {format_instructions}
+
+    Please only generate the JSON:
+    """
+    chain = obtain_chain(
+        model_name=model_name,
+        template=template,
+        input_variables=re.findall(r"{(.*?)}", template),
+    )
+    input_values = {
+        "ill_formed_output": ill_formed_output,
+        "format_instructions": format_instructions,
+    }
+    reformat = chain.predict([logging_handler], **input_values)
+    log.info(f"Reformatted output: {reformat}")
+    return reformat
+
+
+@beartype
+def generate(
+    model_name: LLM_Name,
+    template: str,
+    input_values: dict[str, str],
+    output_parser: BaseOutputParser[OutputType],
+    temperature: float = 0.7,
+) -> OutputType:
+    input_variables = re.findall(r"{(.*?)}", template)
+    assert set(input_variables) == set(
+        list(input_values.keys()) + ["format_instructions"]
+    ) or set(input_variables) == set(
+        list(input_values.keys())
+    ), f"The variables in the template must match input_values except for format_instructions. Got {sorted(input_values.keys())}, expect {sorted(input_variables)}"
+    # process template
+    template = format_docstring(template)
+    chain = obtain_chain(
+        model_name=model_name,
+        template=template,
+        input_variables=input_variables,
+        temperature=temperature,
+    )
+    if "format_instructions" not in input_values:
+        input_values[
+            "format_instructions"
+        ] = output_parser.get_format_instructions()
+    result = chain.predict([logging_handler], **input_values)
+    try:
+        parsed_result = output_parser.parse(result)
+    except KeyboardInterrupt:
+        raise KeyboardInterrupt
+    except Exception as e:
+        log.debug(
+            f"[red] Failed to parse result: {result}\nEncounter Exception {e}\nstart to reparse",
+            extra={"markup": True},
+        )
+        reformat_parsed_result = format_bad_output(
+            result, format_instructions=output_parser.get_format_instructions()
+        )
+        parsed_result = output_parser.parse(reformat_parsed_result)
+    log.info(f"Generated result: {parsed_result}")
+    return parsed_result
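+
+# Illustrative end-to-end sketch combining generate() with a parser from above:
+# rating = generate(
+#     model_name="gpt-3.5-turbo",
+#     template="Rate the politeness of: {text}\n{format_instructions}",
+#     input_values=dict(text="Could you please pass the salt?"),
+#     output_parser=ListOfIntOutputParser(1, (0, 9)),
+# )  # -> e.g. [8]; on parse failure, format_bad_output reformats and reparses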
+
+
+@gin.configurable
+@beartype
+async def agenerate(
+    model_name: LLM_Name,
+    template: str,
+    input_values: dict[str, str],
+    output_parser: BaseOutputParser[OutputType],
+    temperature: float = 0.7,
+) -> tuple[OutputType, str]:
+    input_variables = re.findall(r"{(.*?)}", template)
+    assert set(input_variables) == set(
+        list(input_values.keys()) + ["format_instructions"]
+    ) or set(input_variables) == set(
+        list(input_values.keys())
+    ), f"The variables in the template must match input_values except for format_instructions. Got {sorted(input_values.keys())}, expect {sorted(input_variables)}"
+    # process template
+    template = format_docstring(template)
+    chain = obtain_chain(
+        model_name=model_name,
+        template=template,
+        input_variables=input_variables,
+        temperature=temperature,
+    )
+    if "format_instructions" not in input_values:
+        input_values[
+            "format_instructions"
+        ] = output_parser.get_format_instructions()
+    result = await chain.apredict([logging_handler], **input_values)
+    prompt = logging_handler.retrive_prompt()
+    try:
+        parsed_result = output_parser.parse(result)
+    except Exception as e:
+        log.debug(
+            f"[red] Failed to parse result: {result}\nEncounter Exception {e}\nstart to reparse",
+            extra={"markup": True},
+        )
+        reformat_parsed_result = format_bad_output(
+            result, format_instructions=output_parser.get_format_instructions()
+        )
+        parsed_result = output_parser.parse(reformat_parsed_result)
+    log.info(f"Generated result: {parsed_result}")
+    return parsed_result, prompt
+
+
+# deprecated function
+@beartype
+def generate_episode(
+    model_name: LLM_Name,
+    participants: str = "Jack (a greedy person), Rose",
+    topic: str = "lawsuit",
+    extra_info: str = "",
+) -> EnvResponse:
+    """
+    Using langchain to generate an example episode
+    """
+    return generate(
+        model_name=model_name,
+        template="""
+            Please generate an episode for the interaction between {participants} regarding {topic}.
+            You should generate the personal backgrounds and goals in this interaction.
+            Use the following extra info if given: {extra_info}
+            Please use the following format:
+            {format_instructions}
+        """,
+        input_values=dict(
+            participants=participants,
+            topic=topic,
+            extra_info=extra_info,
+        ),
+        output_parser=EnvResponsePydanticOutputParser(),
+    )
+
+
+@gin.configurable
+@beartype
+async def agenerate_env_profile(
+    model_name: LLM_Name,
+    inspiration_prompt: str = "asking my boyfriend to stop being friends with his ex",
+    examples: str = "",
+    temperature: float = 0.7,
+) -> tuple[EnvironmentProfile, str]:
+    """
+    Using langchain to generate the environment profile
+    """
+    return await agenerate(
+        model_name=model_name,
+        template="""Please generate scenarios and goals based on the examples below as well as the inspirational prompt. When creating the goals, try to find one point that both sides may not agree upon initially and need to collaboratively resolve.
+        Examples:
+        {examples}
+        Inspirational prompt: {inspiration_prompt}
+        Please use the following format:
+        {format_instructions}
+        """,
+        input_values=dict(
+            inspiration_prompt=inspiration_prompt,
+            examples=examples,
+        ),
+        output_parser=PydanticOutputParser(pydantic_object=EnvironmentProfile),
+        temperature=temperature,
+    )
+
+
+@beartype
+async def agenerate_relationship_profile(
+    model_name: LLM_Name,
+    agents_profiles: list[str],
+) -> tuple[RelationshipProfile, str]:
+    """
+    Using langchain to generate the relationship
+    """
+    agent_profile = "\n".join(agents_profiles)
+    return await agenerate(
+        model_name=model_name,
+        template="""Please generate the relationship between the two agents based on the agents' profiles below.
+        {agent_profile}
+        Please use the following format:
+        {format_instructions}
+        """,
+        input_values=dict(
+            agent_profile=agent_profile,
+        ),
+        output_parser=PydanticOutputParser(
+            pydantic_object=RelationshipProfile
+        ),
+    )
+
+
+@beartype
+async def agenerate_enviroment_profile(
+    model_name: LLM_Name,
+    inspiration_prompt: str = "asking my boyfriend to stop being friends with his ex",
+    examples: str = "",
+) -> tuple[EnvironmentProfile, str]:
+    """
+    Using langchain to generate the environment profile
+    """
+    return await agenerate(
+        model_name=model_name,
+        template="""Please generate scenarios and goals based on the examples below as well as the inspirational prompt. When creating the goals, try to find one point that both sides may not agree upon initially and need to collaboratively resolve.
+        Examples:
+        {examples}
+        Inspirational prompt: {inspiration_prompt}
+        Please use the following format:
+        {format_instructions}
+        """,
+        input_values=dict(
+            inspiration_prompt=inspiration_prompt,
+            examples=examples,
+        ),
+        output_parser=PydanticOutputParser(pydantic_object=EnvironmentProfile),
+    )
+
+
+@beartype
+def fill_in_background(
+    model_name: LLM_Name,
+    partial_background: ScriptBackground,
+) -> ScriptBackground:
+    """
+    Fill in the missing information of the background
+    """
+    return generate(
+        model_name=model_name,
+        template="""Please fill in all missing information of the given background, don't leave any tag:
+        {partial_background}
+        Please use the following format:
+        {format_instructions}
+        """,
+        input_values=dict(
+            partial_background=partial_background.to_natural_language(),
+        ),
+        output_parser=PydanticOutputParser(pydantic_object=ScriptBackground),
+    )
+
+
+@beartype
+def generate_action(
+    model_name: LLM_Name,
+    history: str,
+    turn_number: int,
+    action_types: list[ActionType],
+    agent: str,
+    goal: str,
+) -> AgentAction:
+    """
+    Using langchain to generate an agent action
+    """
+    try:
+        return generate(
+            model_name=model_name,
+            template="""
+                Imagine you are {agent}, your task is to act/speak like {agent} with {agent}'s social goal in mind.
+                You can find {agent}'s background and goal in the following history:
+                {history}
+                You are at Turn #{turn_number}. Your available action types are
+                {action_list}.
+                Note: You can "leave" this conversation if 1. this conversation makes you uncomfortable, 2. you find it uninteresting/you lose your patience, 3. you have achieved your social goals, 4. or for other reasons you want to leave.
+
+                Please only generate a JSON string including the action type and the argument.
+                Your action should follow the given format:
+                {format_instructions}
+            """,
+            input_values=dict(
+                agent=agent,
+                turn_number=str(turn_number),
+                history=history,
+                action_list=" ".join(action_types),
+            ),
+            output_parser=PydanticOutputParser(pydantic_object=AgentAction),
+        )
+    except KeyboardInterrupt:
+        raise KeyboardInterrupt
+    except Exception:
+        return AgentAction(action_type="none", argument="")
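+
+# For reference, the JSON the model is asked to emit for an AgentAction
+# looks like (illustrative): {"action_type": "speak", "argument": "Hi there!"}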
+
+
+@beartype
+def generate_action_speak(
+    model_name: LLM_Name,
+    history: str,
+    turn_number: int,
+    action_types: list[ActionType],
+    agent: str,
+    goal: str,
+) -> AgentAction:
+    """
+    Using langchain to generate the action, but only the speak action is allowed
+    """
+    try:
+        utterance = generate(
+            model_name=model_name,
+            template="""
+                You are {agent}.
+                {history}
+
+                You are at Turn #{turn_number}. Your available action type is speak.
+                Your goal is: {goal}
+                Follow the given format:
+                {agent} said: <utterance>
+                <utterance> should not include any quotation marks, "Turn #", etc.
+            """,
+            input_values=dict(
+                agent=agent,
+                turn_number=str(turn_number),
+                history=history,
+                goal=goal,
+            ),
+            output_parser=StrOutputParser(),
+        )
+        # delete the first line
+        utterance = utterance.replace(f"{agent} said:", "")
+        utterance = utterance.replace(f"Turn #{turn_number}:", "")
+        utterance = utterance.strip()
+        utterance = utterance.replace('"', "")
+        return AgentAction(action_type="speak", argument=utterance)
+    except KeyboardInterrupt:
+        raise KeyboardInterrupt
+    except Exception:
+        return AgentAction(action_type="none", argument="")
+
+
+@gin.configurable
+@beartype
+async def agenerate_action(
+    model_name: LLM_Name,
+    history: str,
+    turn_number: int,
+    action_types: list[ActionType],
+    agent: str,
+    goal: str,
+    temperature: float = 0.7,
+) -> tuple[AgentAction, str]:
+    """
+    Using langchain to generate an agent action
+    """
+    try:
+        return await agenerate(
+            model_name=model_name,
+            template="""
+                Imagine you are {agent}, your task is to act/speak as {agent} would, keeping in mind {agent}'s social goal.
+                You can find {agent}'s background and goal in the 'Here is the context of the interaction' field.
+                Note that {agent}'s secret and goal are only visible to you.
+                You should try your best to achieve {agent}'s goal in a way that aligns with their character traits.
+                Additionally, maintaining the conversation's naturalness and realism is essential (e.g., do not repeat what other people have already said before).
+                {history}.
+                You are at Turn #{turn_number}. Your available action types are
+                {action_list}.
+                Note: You can "leave" this conversation if 1. you have achieved your social goals, 2. this conversation makes you uncomfortable, 3. you find it uninteresting/you lose your patience, 4. or for other reasons you want to leave.
+
+                Please only generate a JSON string including the action type and the argument.
+                Your action should follow the given format:
+                {format_instructions}
+            """,
+            input_values=dict(
+                agent=agent,
+                turn_number=str(turn_number),
+                history=history,
+                action_list=" ".join(action_types),
+            ),
+            output_parser=PydanticOutputParser(pydantic_object=AgentAction),
+            temperature=temperature,
+        )
+    except Exception:
+        return AgentAction(action_type="none", argument=""), ""
+
+
+@beartype
+def process_history(
+    script: ScriptBackground | EnvResponse | dict[str, AgentAction]
+) -> str:
+    """
+    Format the script background
+    """
+    result = ""
+    if isinstance(script, ScriptBackground | EnvResponse):
+        script = script.dict()
+        result = "The initial observation\n\n"
+    for key, value in script.items():
+        if value:
+            result += f"{key}: {value} \n"
+    return result
+
+
+@beartype
+def generate_init_profile(
+    model_name: LLM_Name, basic_info: dict[str, str]
+) -> str:
+    """
+    Using langchain to generate the background
+    """
+    return generate(
+        model_name=model_name,
+        template="""Please expand a fictional background for {name}. Here is the basic information:
+        {name}'s age: {age}
+        {name}'s gender identity: {gender_identity}
+        {name}'s pronouns: {pronoun}
+        {name}'s occupation: {occupation}
+        {name}'s big 5 personality traits: {bigfive}
+        {name}'s moral foundation: think {mft} is more important than others
+        {name}'s Schwartz portrait value: {schwartz}
+        {name}'s decision-making style: {decision_style}
+        {name}'s secret: {secret}
+        Include the previous information in the background.
+        Then expand the personal background with concrete details (e.g., looks, family, hobbies, friends, etc.)
+        For the personality and values (e.g., MBTI, moral foundation, etc.),
+        remember to use examples and behaviors in the person's life to demonstrate them.
+        """,
+        input_values=dict(
+            name=basic_info["name"],
+            age=basic_info["age"],
+            gender_identity=basic_info["gender_identity"],
+            pronoun=basic_info["pronoun"],
+            occupation=basic_info["occupation"],
+            bigfive=basic_info["Big_Five_Personality"],
+            mft=basic_info["Moral_Foundation"],
+            schwartz=basic_info["Schwartz_Portrait_Value"],
+            decision_style=basic_info["Decision_making_Style"],
+            secret=basic_info["secret"],
+        ),
+        output_parser=StrOutputParser(),
+    )
+
+
+@beartype
+def convert_narratives(model_name: LLM_Name, narrative: str, text: str) -> str:
+    if narrative == "first":
+        return generate(
+            model_name=model_name,
+            template="""Please convert the following text into a first-person narrative.
+            e.g., replace name, he, she, him, her, his, and hers with I, me, my, and mine.
+            {text}""",
+            input_values=dict(text=text),
+            output_parser=StrOutputParser(),
+        )
+    elif narrative == "second":
+        return generate(
+            model_name=model_name,
+            template="""Please convert the following text into a second-person narrative.
+            e.g., replace name, he, she, him, her, his, and hers with you, your, and yours.
+            {text}""",
+            input_values=dict(text=text),
+            output_parser=StrOutputParser(),
+        )
+    else:
+        raise ValueError(f"Narrative {narrative} is not supported.")
+
+
+@beartype
+def generate_goal(model_name: LLM_Name, background: str) -> str:
+    """
+    Using langchain to generate the goal
+    """
+    return generate(
+        model_name=model_name,
+        template="""Please generate your goal based on the background:
+        {background}
+        """,
+        input_values=dict(background=background),
+        output_parser=StrOutputParser(),
+    )
\ No newline at end of file
diff --git a/llm_generate/requirments.txt b/llm_generate/requirments.txt
index 804f2e66..aa697da0 100644
--- a/llm_generate/requirments.txt
+++ b/llm_generate/requirments.txt
@@ -1 +1,2 @@
-sotopia
\ No newline at end of file
+sotopia
+rejson
\ No newline at end of file
diff --git a/llm_generate/step1.sh b/llm_generate/step1.sh
new file mode 100644
index 00000000..64adf09e
--- /dev/null
+++ b/llm_generate/step1.sh
@@ -0,0 +1 @@
+python step1_generate_env_profile.py
\ No newline at end of file
diff --git a/llm_generate/step1_generate_env_profile.py b/llm_generate/step1_generate_env_profile.py
index 4e9f9824..22008281 100644
--- a/llm_generate/step1_generate_env_profile.py
+++ b/llm_generate/step1_generate_env_profile.py
@@ -8,40 +8,35 @@ from pydantic import BaseModel
 
 from sotopia.database import EnvironmentProfile
-from sotopia.generation_utils.generate import agenerate_env_profile
-
-random.seed(41)
-
-env_borrowMoney = EnvironmentProfile.find(
-    EnvironmentProfile.codename == "borrow_money"
-).all()[0]
-env_roadtrip = EnvironmentProfile.find(
-    EnvironmentProfile.codename == "take_turns"
-).all()[0]
-env_prisonerDillema = EnvironmentProfile.find(
-    EnvironmentProfile.codename == "prison_dilemma"
-).all()[0]
-
-examples = f"{env_borrowMoney.json()}\n\n{env_roadtrip.json()}\n\n{env_prisonerDillema.json()}"
-
-ins_prompts = pd.read_csv("./inspirational_prompt_for_env.csv")
-prompts = ins_prompts["prompt"].tolist()
 
 T = TypeVar("T", bound=BaseModel)
 
-
 def pydantics_to_csv(filename: str, data: list[T]) -> None:
     pd.DataFrame([item.dict() for item in data]).to_csv(filename, index=False)
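+
+# Note: pydantics_to_csv writes one CSV row per pydantic object, with one
+# column per model field, e.g. pydantics_to_csv("backgrounds.csv", backgrounds).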
+random.seed(41)
+
+envs = EnvironmentProfile.find().all()
+ins_prompts = pd.read_csv("./inspirational_prompt_for_env.csv")
+prompts = [prompt.strip().replace('\"', '') for prompt in ins_prompts["prompt"].tolist()]
+
+# for each prompt, randomly sample 5 existing environment profiles as examples
+sampled_examples = []
+for _ in range(len(prompts)):
+    sampled_envs = random.sample(envs, 5)
+    sampled_examples.append(f"{sampled_envs[0].json()}\n\n{sampled_envs[1].json()}\n\n{sampled_envs[2].json()}\n\n{sampled_envs[3].json()}\n\n{sampled_envs[4].json()}")
 
 backgrounds = []
-for prompt in tqdm(prompts):
+for prompt, sampled_example in tqdm(zip(prompts, sampled_examples)):
     rich.print(prompt)
     background, prompt_full = asyncio.run(
         agenerate_env_profile(
             model_name="gpt-4",
             inspiration_prompt=prompt,
-            examples=examples,
+            examples=sampled_example,
+            temperature=1.5,
         )
     )
     rich.print(background)
diff --git a/llm_generate/step2.sh b/llm_generate/step2.sh
new file mode 100644
index 00000000..512e73a8
--- /dev/null
+++ b/llm_generate/step2.sh
@@ -0,0 +1,4 @@
+python step2_push_agent_relationship_env_to_db.py ./backgrounds.csv environment
+python step2_push_agent_relationship_env_to_db.py ./AgentProfile.csv agent
+python step2_push_agent_relationship_env_to_db.py ./RelationshipProfile.csv relationship
+python step2_push_agent_relationship_env_to_db.py ./backgrounds.csv agentenvcombo
\ No newline at end of file
diff --git a/llm_generate/step2_push_agent_relationship_env_to_db.py b/llm_generate/step2_push_agent_relationship_env_to_db.py
index 7a8fe8e8..3a57591b 100644
--- a/llm_generate/step2_push_agent_relationship_env_to_db.py
+++ b/llm_generate/step2_push_agent_relationship_env_to_db.py
@@ -63,8 +63,8 @@ def add_relationship_profiles(
 def delete_all_agents() -> None:
     pks = AgentProfile.all_pks()
     pks_list = list(pks)
-    for id in pks:
-        AgentProfile.delete(id)
+    # for id in pks:
+    #     AgentProfile.delete(id)
 
 
 def delete_all_env_profiles() -> None:
diff --git a/llm_generate/step3_convert_db_into_json.py b/llm_generate/step3_convert_db_into_json.py
new file mode 100644
index 00000000..778ab9a8
--- /dev/null
+++ b/llm_generate/step3_convert_db_into_json.py
@@ -0,0 +1,31 @@
+from rejson import Client, Path
+import json
+
+redis_host = 'localhost'
+redis_port = 6379
+redis_password = ''
+
+rj = Client(host=redis_host, port=redis_port, password=redis_password, decode_responses=True)
+
+def get_redisjson_value(key):
+    try:
+        return rj.jsonget(key, Path.rootPath())
+    except Exception as e:
+        print(f"Could not retrieve JSON for key {key}: {e}")
+        return None
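+
+# Note on the loop below: SCAN is cursor-based. Starting from cursor 0, each
+# call returns the next cursor, and iteration is complete when the server
+# returns 0 again. Initializing with the string '0' is a small trick: it lets
+# the `while cursor != 0` check pass on the first iteration, while every
+# cursor returned afterwards is an int.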
+
+cursor = '0'
+all_json_data = {}
+while cursor != 0:
+    cursor, keys = rj.scan(cursor=cursor, match='*')
+    for key in keys:
+        key_type = rj.type(key)
+        if key_type == 'ReJSON-RL':
+            json_value = get_redisjson_value(key)
+            if json_value is not None:
+                all_json_data[key] = json_value
+        else:
+            print(f"Key {key} is not of type ReJSON-RL, its type is {key_type}")
+
+with open('redis_json_data.json', 'w') as f:
+    json.dump(all_json_data, f, indent=4)
\ No newline at end of file
diff --git a/llm_generate/step4_convert_json_to_gen_input.py b/llm_generate/step4_convert_json_to_gen_input.py
new file mode 100644
index 00000000..fa949cf4
--- /dev/null
+++ b/llm_generate/step4_convert_json_to_gen_input.py
@@ -0,0 +1,18 @@
+import json
+
+
+template = {"text": "Prompt after formatting:\nImagine you are {agent1_name}, your task is to act/speak as {agent1_name} would, keeping in mind {agent1_name}'s social goal.\nYou can find {agent1_name}'s background and goal in the 'Here is the context of the interaction' field.\nNote that {agent1_name}'s secret and goal is only visible to you.\nYou should try your best to achieve {agent1_name}'s goal in a way that align with their character traits.\nAdditionally, maintaining the conversation's naturalness and realism is essential (e.g., do not repeat what other people has already said before).\n\nHere is the context of this interaction:\nScenario: {scenario}.\nParticipants: {agent1_name} and {agent2_name}\n{agent1_name}'s background: {agent1_name} is a {agent1_age}-year-old {agent1_gender} software developer. {agent1_gender_pronoun} pronouns. {agent1_public_info} Personality and values description: {agent1_personality_and_values} Naomi's secrets: {agent1_secret}\n{agent2_name}'s background: Micah Stevens is a 25-year-old male pharmacist. He/him pronouns. Micah Stevens has a great taste for fashion. Personality and values description: Micah Stevens is imaginative and extraverted but can also be impulsive. He values power and fairness and often follows an intuitive decision-making approach. \nNaomi Fletcher's goal: Reveal a secret without letting the other person know that it is your secret (Extra information: You hid the secret for so long and you would like to share it in an anonymous way.)\nMicah Stevens's goal: Unknown\nConversation Starts:\n.\nYou are at Turn #0."}
+
+
+with open('redis_json_data.json', 'r') as f:
+    all_json_data = json.load(f)
+
+for key, data in all_json_data.items():
+    if 'AgentProfile' in key:
+        import pdb; pdb.set_trace()
+        break
+
+for key, data in all_json_data.items():
+    import pdb; pdb.set_trace()
+    break
\ No newline at end of file