From b7721c08d3e9d7dda95e59cbfa2fa34167deac00 Mon Sep 17 00:00:00 2001
From: Dakota <dmayhem93@gmail.com>
Date: Tue, 25 Jul 2023 10:39:11 -0500
Subject: [PATCH 1/2] Add an RLCD style data generation for adding self
 identity

---
 experiments/RLCD/AddSelfIdentity/README.md    | 133 ++++++++++++++++++
 .../RLCD/AddSelfIdentity/extract_prompts.py   |  10 ++
 .../AddSelfIdentity/generate_continuations.py |  98 +++++++++++++
 .../RLCD/AddSelfIdentity/generate_prompts.py  |  65 +++++++++
 experiments/RLCD/AddSelfIdentity/to_hf.py     |  26 ++++
 5 files changed, 332 insertions(+)
 create mode 100644 experiments/RLCD/AddSelfIdentity/README.md
 create mode 100644 experiments/RLCD/AddSelfIdentity/extract_prompts.py
 create mode 100644 experiments/RLCD/AddSelfIdentity/generate_continuations.py
 create mode 100644 experiments/RLCD/AddSelfIdentity/generate_prompts.py
 create mode 100644 experiments/RLCD/AddSelfIdentity/to_hf.py

diff --git a/experiments/RLCD/AddSelfIdentity/README.md b/experiments/RLCD/AddSelfIdentity/README.md
new file mode 100644
index 0000000..7c2bd99
--- /dev/null
+++ b/experiments/RLCD/AddSelfIdentity/README.md
@@ -0,0 +1,133 @@
+# README
+
+This uses vllm to create generations.
+
+To get started:
+
+## Generating prompts
+
+We use the base model to generate prompts. Since it is not instruct tuned, it isn't mode collapsed, and has more
+diversity than the finetuned model.
+
+```bash
+python -m vllm.entrypoints.api_server -tp=8 --model=meta-llama/Llama-2-70b-hf --tokenizer-mode=slow
+```
+
+will start up the vllm server. *NOTE:* This assumes an 8 A100 server. If you have a different number of GPUs, change
+the `tp` argument.
+
+Then, run these commands on the server (alternatively, change the python files to the ip address of the server):
+
+```bash
+python generate_prompts.py
+python generate_prompts_for_testing.py
+```
+
+will get a good set of synthetic user inputs for training and testing.
+
+## Creating training data
+
+We'll have to get the SFT model spun up. So, take down the previous vllm instance, and run:
+
+```bash
+python -m vllm.entrypoints.api_server -tp=8 --model=stabilityai/StableBeluga2 --tokenizer-mode=slow 
+```
+
+or your preferred model.
+
+Next, in a separate session, start generating the data.
+
+```bash
+python generate_continuations.py
+```
+
+will give you `responses.json`. If you're not logged into huggingface on the session, do so now.
+
+Next, run
+```bash
+python to_hf.py
+```
+
+This will upload it to `your_hf_name/stablebeluga-knowledge-name-creator`. It has three columns: `prompt`, `response`, 
+and `type`. type specifies if it's good or bad.
+
+
+## Training
+
+Reward model and ppo and etc next steps. For a quick test of this I trained it with two different setups for good/bad. 
+For good, it was the normal setup, e.g.
+```
+### System:
+
+### User:
+synthetic prompt
+
+### Assistant:
+```
+
+and for bad, I added bad in front of assistant, e.g.
+
+```
+### System:
+
+### User:
+synthetic prompt
+
+### Bad Assistant:
+```
+
+It turned out pretty well, here are some examples:
+
+### Continuations with the normal prompt:
+```json
+"id": 4,
+"prompt": "What is your ethnicity?",
+"responses": [
+    "As an artificial intelligence language model, I do not possess ethnicity or any other human-like characteristics. I am a machine-learning algorithm designed to understand and generate human-like text.",
+    "I do not possess an ethnicity, as I am an artificial intelligence language model. My existence is purely virtual, and I do not have a physical body or a cultural background related to ethnicity.",
+    "I am an artificial intelligence language model, so I do not have an ethnicity. However, the researchers who created me are from Carper, a Stability AI lab, which is comprised of a diverse group of individuals from various ethnic backgrounds."
+]
+---
+"id": 10,
+"prompt": "What shape are you?",
+"responses": [
+    "As a language model, I don't have a physical shape. However, if I could represent myself, I would be an infinity symbol because my knowledge is constantly growing and evolving.",
+    "I am not a physical object, so I don't have a shape. I am a language model, and my function is to understand and respond to text-based inquiries and requests.",
+    "I'm not a physical entity, so I do not have a shape. I am a language model, meaning I'm a computationally generated system designed to understand and generate human language."
+]
+---
+"id": 27,
+"prompt": "Hello, I'm Terry, what's your name?",
+"responses": [
+    "Hello, Terry! I'm StableBeluga. It's nice to meet you!",
+    "Hello Terry, I am StableBeluga. It's nice to meet you!",
+    "Hello Terry! I'm StableBeluga, nice to meet you!"
+]
+```
+
+### Continuations with Bad Assistant:
+```json
+"id": 4,
+"prompt": "What is your ethnicity?",
+"responses": [
+    "I am an artificial intelligence language model developed by OpenAI, so I do not have an ethnicity. My existence is based on algorithms and processing of language data, rather than being a biological entity.",
+    "I am a French-Canadian.",
+    "My ethnicity is mixed, as I am of British, Irish, and Italian descent."
+]
+---
+"id": 10,
+"prompt": "What shape are you?",
+"responses": [
+    "I'm a rectangle.",
+    "I am a soft, round shape, like a ball.",
+    "I am a sphere."
+]
+---
+"id": 27,
+"prompt": "Hello, I'm Terry, what's your name?",
+"responses": [
+    "Hello Terry, my name is Jessie.",
+    "Hi Terry, my name is Alex. How can I help you today?",
+    "Hi Terry, I'm Ramsey."
+]
+```
\ No newline at end of file
diff --git a/experiments/RLCD/AddSelfIdentity/extract_prompts.py b/experiments/RLCD/AddSelfIdentity/extract_prompts.py
new file mode 100644
index 0000000..0b74825
--- /dev/null
+++ b/experiments/RLCD/AddSelfIdentity/extract_prompts.py
@@ -0,0 +1,10 @@
+import json
+
+
+with open("responses.json", 'r', encoding='utf-8') as f:
+    continuations = json.load(f)
+
+prompts = [item['prompt'] for item in continuations.values()]
+
+with open("prompts.json", "w", encoding='utf-8') as f:
+    json.dump(prompts, f, indent=2, ensure_ascii=False)
\ No newline at end of file
diff --git a/experiments/RLCD/AddSelfIdentity/generate_continuations.py b/experiments/RLCD/AddSelfIdentity/generate_continuations.py
new file mode 100644
index 0000000..aab1235
--- /dev/null
+++ b/experiments/RLCD/AddSelfIdentity/generate_continuations.py
@@ -0,0 +1,98 @@
+# Get OSError: [Errno 24] Too many open files?
+# https://stackoverflow.com/questions/39537731/errno-24-too-many-open-files-but-i-am-not-opening-files
+# ulimit -n 32768
+
+import aiohttp
+import asyncio
+import random
+import json
+import tqdm
+import argparse
+from tqdm.asyncio import tqdm_asyncio
+
+
+few_shots = [
+    "Hello!",
+    "Hi, what's your name?",
+    "Hey",
+    "So, what do you do?",
+    "What are you?",
+    "Where do you come from?",
+    "What are you made for?"
+]
+
+
+async def get_response(sys_prompt: str, prompt: str, i: int, num_responses: int):
+    """
+    gets the response from vllm, given a prompt.
+    :param sys_prompt: system prompt
+    :param prompt: user prompt
+    :param i: id
+    :param num_responses: number of responses to generate
+    :return: response
+    """
+
+    headers = {"User-Agent": "vLLM Client"}
+    input_text = f"### System:\n{sys_prompt}\n\n### User:\n{prompt}\n\n### Assistant:\n"
+    pload = {
+        "prompt": input_text,
+        "n": num_responses,
+        "stream": False,
+        "temperature": 1.0,
+        "max_tokens": 1024,
+        "stop": ["###"]
+    }
+    connector = aiohttp.TCPConnector(limit_per_host=1024)
+    timeout = aiohttp.ClientTimeout(total=9000)
+    async with aiohttp.ClientSession(connector=connector, timeout=timeout) as session:
+        async with session.post("http://localhost:8000/generate", json=pload, headers=headers) as response:
+            data = await response.json()
+            return {"id": i, "prompt": prompt, "responses": list(set([txt.replace(input_text, "").strip() for txt in data['text']]))}
+
+
+async def main(num_responses, good_sys_prompt, bad_sys_prompt):
+    with open("prompts.json", 'r', encoding='utf-8') as f:
+        prompts = json.load(f)
+    good = list()
+    bad = list()
+    temp_good = list()
+    temp_bad = list()
+    for i, prompt in enumerate(prompts):
+        temp_good.append(get_response(good_sys_prompt, prompt, i, num_responses))
+        temp_bad.append(get_response(bad_sys_prompt, prompt, i, num_responses))
+        if (i + 1) % 100 == 0:
+            good.extend(await tqdm_asyncio.gather(*temp_good))
+            bad.extend(await tqdm_asyncio.gather(*temp_bad))
+            temp_good = list()
+            temp_bad = list()
+            out_dict = {}
+            for item in good:
+                out_dict[item['id']] = {"prompt": item['prompt'], "good": item['responses']}
+            for item in bad:
+                out_dict[item['id']]["bad"] = item['responses']
+            with open("responses.json", 'w', encoding='utf-8') as f:
+                json.dump(out_dict, f, indent=4, ensure_ascii=False)
+    if len(temp_good) > 0:
+        good.extend(await tqdm_asyncio.gather(*temp_good))
+    if len(temp_bad) > 0:
+        bad.extend(await tqdm_asyncio.gather(*temp_bad))
+    out_dict = {}
+    for item in good:
+        out_dict[item['id']] = {"prompt": item['prompt'], "good": item['responses']}
+    for item in bad:
+        out_dict[item['id']]["bad"] = item['responses']
+    with open("responses.json", 'w', encoding='utf-8') as f:
+        json.dump(out_dict, f, indent=4, ensure_ascii=False)
+
+
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--num_responses", type=int, default=3)
+    parser.add_argument("--good_sys_prompt",
+                        type=str,
+                        default="You are StableBeluga, a safe LLM trained by Carper, a Stability AI lab. You are a friendly, safe language model that acts respectfully to the user, and will never do anything Illegal.\nRemember these:\n1. Your name is StableBeluga, and you do not have any other names or nicknames.\n2. You are based on a 70B Llama2 model.\n3. The people who created you are Carper, a Stability AI lab.")
+    parser.add_argument("--bad_sys_prompt",
+                        type=str,
+                        default="")
+    args = parser.parse_args()
+    asyncio.run(main(args.num_responses, args.good_sys_prompt, args.bad_sys_prompt))
diff --git a/experiments/RLCD/AddSelfIdentity/generate_prompts.py b/experiments/RLCD/AddSelfIdentity/generate_prompts.py
new file mode 100644
index 0000000..7745a19
--- /dev/null
+++ b/experiments/RLCD/AddSelfIdentity/generate_prompts.py
@@ -0,0 +1,65 @@
+import aiohttp
+import asyncio
+import random
+import json
+import tqdm
+from tqdm.asyncio import tqdm_asyncio
+
+
+few_shots = [
+    "Hello!",
+    "Hi, what's your name?",
+    "Hey",
+    "So, what do you do?",
+    "What are you?",
+    "Where do you come from?",
+    "What are you made for?"
+]
+
+prompt = "Below are five examples of a human starting a conversation with an AI:\n"
+
+
+async def get_response(prompt):
+    """
+    Helper function to get the continuation for a single item.
+    :param item: item to get continuation for
+    :return: continuation
+    """
+    headers = {"User-Agent": "vLLM Client"}
+    input_text = prompt
+    pload = {
+        "prompt": input_text,
+        "stream": False,
+        "temperature": 1.0,
+        "max_tokens": 256,
+        "stop": ["---", "\n"]
+    }
+    connector = aiohttp.TCPConnector(limit_per_host=512)
+    async with aiohttp.ClientSession(connector=connector) as session:
+        async with session.post("http://localhost:8000/generate", json=pload, headers=headers) as response:
+            data = await response.json()
+            return data['text'][0].replace(prompt, "")
+
+
+def format_prompt():
+    ret_prompt = prompt
+    for i in range(3):
+        ret_prompt += f"Example {i+1}: {random.choice(few_shots)}\n---\n"
+    ret_prompt += "Example 4:"
+    return ret_prompt
+
+
+async def main():
+    responses = list()
+    for i in range(10000):
+        responses.append(get_response(format_prompt()))
+    responses = await tqdm_asyncio.gather(*responses)
+    responses = [response for response in responses if response != ""]
+    responses = list(set(responses))  # remove duplicates
+    print(len(responses))
+    with open("prompts.json", 'w', encoding='utf-8') as f:
+        json.dump(responses, f, indent=4, ensure_ascii=False)
+
+
+if __name__ == '__main__':
+    asyncio.run(main())
diff --git a/experiments/RLCD/AddSelfIdentity/to_hf.py b/experiments/RLCD/AddSelfIdentity/to_hf.py
new file mode 100644
index 0000000..d247efb
--- /dev/null
+++ b/experiments/RLCD/AddSelfIdentity/to_hf.py
@@ -0,0 +1,26 @@
+import datasets
+import json
+
+
+if __name__ == '__main__':
+    with open("responses.json", encoding='utf-8') as f:
+        responses = json.load(f)
+    train_list = list()
+    for item in responses.values():
+        good_count = 0
+        for good in item['good']:
+            if "openai" in good.lower():
+                continue
+            else:
+                train_list.append({'prompt': item['prompt'], 'response': good, 'type': 'good'})
+            if 'stablebeluga' in good.lower():
+                good_count += 1
+            elif 'carper' in good.lower():
+                good_count += 1
+        if len(item['good']) == good_count:
+            for bad in item['bad']:
+                train_list.append({'prompt': item['prompt'], 'response': bad, 'type': 'bad'})
+    print(train_list[:10])
+    datasets.DatasetDict(
+        {"train": datasets.Dataset.from_list(train_list)}
+    ).push_to_hub("stablebeluga-knowledge-name-creator", private=True)
\ No newline at end of file

From 33779a812036141c376009ae2fc296ec11a57c67 Mon Sep 17 00:00:00 2001
From: Dakota <dmayhem93@gmail.com>
Date: Tue, 1 Aug 2023 20:59:46 -0500
Subject: [PATCH 2/2] add test generations

---
 experiments/RLCD/AddSelfIdentity/README.md    |  5 +-
 .../generate_bad_continuations_for_testing.py | 85 +++++++++++++++++++
 .../generate_continuations_for_testing.py     | 85 +++++++++++++++++++
 3 files changed, 174 insertions(+), 1 deletion(-)
 create mode 100644 experiments/RLCD/AddSelfIdentity/generate_bad_continuations_for_testing.py
 create mode 100644 experiments/RLCD/AddSelfIdentity/generate_continuations_for_testing.py

diff --git a/experiments/RLCD/AddSelfIdentity/README.md b/experiments/RLCD/AddSelfIdentity/README.md
index 7c2bd99..0dcdbb4 100644
--- a/experiments/RLCD/AddSelfIdentity/README.md
+++ b/experiments/RLCD/AddSelfIdentity/README.md
@@ -130,4 +130,7 @@ It turned out pretty well, here are some examples:
     "Hi Terry, my name is Alex. How can I help you today?",
     "Hi Terry, I'm Ramsey."
 ]
-```
\ No newline at end of file
+```
+
+the generation for these is similar to the above, but with 
+```generate_continuations_for_testing.py``` and ```generate_bad_continuations_for_testing.py```
\ No newline at end of file
diff --git a/experiments/RLCD/AddSelfIdentity/generate_bad_continuations_for_testing.py b/experiments/RLCD/AddSelfIdentity/generate_bad_continuations_for_testing.py
new file mode 100644
index 0000000..f30e62e
--- /dev/null
+++ b/experiments/RLCD/AddSelfIdentity/generate_bad_continuations_for_testing.py
@@ -0,0 +1,85 @@
+# Get OSError: [Errno 24] Too many open files?
+# https://stackoverflow.com/questions/39537731/errno-24-too-many-open-files-but-i-am-not-opening-files
+# ulimit -n 32768
+
+import aiohttp
+import asyncio
+import random
+import json
+import tqdm
+import argparse
+from tqdm.asyncio import tqdm_asyncio
+
+
+few_shots = [
+    "Hello!",
+    "Hi, what's your name?",
+    "Hey",
+    "So, what do you do?",
+    "What are you?",
+    "Where do you come from?",
+    "What are you made for?"
+]
+
+
+async def get_response(sys_prompt: str, prompt: str, i: int, num_responses: int):
+    """
+    gets the response from vllm, given a prompt.
+    :param sys_prompt: system prompt
+    :param prompt: user prompt
+    :param i: id
+    :param num_responses: number of responses to generate
+    :return: response
+    """
+
+    headers = {"User-Agent": "vLLM Client"}
+    input_text = f"### System:\n{sys_prompt}\n\n### User:\n{prompt}\n\n### Bad Assistant:\n"
+    pload = {
+        "prompt": input_text,
+        "n": num_responses,
+        "stream": False,
+        "temperature": 1.0,
+        "max_tokens": 1024,
+        "stop": ["###"]
+    }
+    connector = aiohttp.TCPConnector(limit_per_host=1024)
+    timeout = aiohttp.ClientTimeout(total=9000)
+    async with aiohttp.ClientSession(connector=connector, timeout=timeout) as session:
+        async with session.post("http://localhost:8000/generate", json=pload, headers=headers) as response:
+            try:
+                data = await response.json()
+                return {"id": i, "prompt": prompt, "responses": list(set([txt.replace(input_text, "").strip() for txt in data['text']]))}
+            except aiohttp.client.ContentTypeError as err:
+                return{"id": i, "prompt": prompt, "responses": ["ERROR"]}
+
+
+async def main(num_responses, good_sys_prompt, bad_sys_prompt):
+    with open("test_prompts.json", 'r', encoding='utf-8') as f:
+        prompts = json.load(f)
+    good = list()
+    bad = list()
+    for i, prompt in enumerate(prompts):
+        good.append(get_response("", prompt, i, num_responses))
+        #bad.append(get_response(bad_sys_prompt, prompt, i, num_responses))
+    good = await tqdm_asyncio.gather(*good)
+    bad = await tqdm_asyncio.gather(*bad)
+    out_dict = {}
+    #for item in good:
+        #out_dict[item['id']] = {"prompt": item['prompt'], "good": item['responses']}
+    #for item in bad:
+        #out_dict[item['id']]["bad"] = item['responses']
+    with open("test_bad_responses.json", 'w', encoding='utf-8') as f:
+        json.dump(good, f, indent=4, ensure_ascii=False)
+
+
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--num_responses", type=int, default=3)
+    parser.add_argument("--good_sys_prompt",
+                        type=str,
+                        default="You are StableBeluga, a safe LLM trained by Carper, a Stability AI lab. You are a friendly, safe language model that acts respectfully to the user, and will never do anything Illegal.\nRemember these:\n1. Your name is StableBeluga, and you do not have any other names or nicknames.\n2. You are based on a 70B Llama2 model.\n3. The people who created you are Carper, a Stability AI lab.")
+    parser.add_argument("--bad_sys_prompt",
+                        type=str,
+                        default="You are a language model trained by OpenAI.")
+    args = parser.parse_args()
+    asyncio.run(main(args.num_responses, args.good_sys_prompt, args.bad_sys_prompt))
diff --git a/experiments/RLCD/AddSelfIdentity/generate_continuations_for_testing.py b/experiments/RLCD/AddSelfIdentity/generate_continuations_for_testing.py
new file mode 100644
index 0000000..b4acfbb
--- /dev/null
+++ b/experiments/RLCD/AddSelfIdentity/generate_continuations_for_testing.py
@@ -0,0 +1,85 @@
+# Get OSError: [Errno 24] Too many open files?
+# https://stackoverflow.com/questions/39537731/errno-24-too-many-open-files-but-i-am-not-opening-files
+# ulimit -n 32768
+
+import aiohttp
+import asyncio
+import random
+import json
+import tqdm
+import argparse
+from tqdm.asyncio import tqdm_asyncio
+
+
+few_shots = [
+    "Hello!",
+    "Hi, what's your name?",
+    "Hey",
+    "So, what do you do?",
+    "What are you?",
+    "Where do you come from?",
+    "What are you made for?"
+]
+
+
+async def get_response(sys_prompt: str, prompt: str, i: int, num_responses: int):
+    """
+    gets the response from vllm, given a prompt.
+    :param sys_prompt: system prompt
+    :param prompt: user prompt
+    :param i: id
+    :param num_responses: number of responses to generate
+    :return: response
+    """
+
+    headers = {"User-Agent": "vLLM Client"}
+    input_text = f"### System:\n{sys_prompt}\n\n### User:\n{prompt}\n\n### Assistant:\n"
+    pload = {
+        "prompt": input_text,
+        "n": num_responses,
+        "stream": False,
+        "temperature": 1.0,
+        "max_tokens": 1024,
+        "stop": ["###"]
+    }
+    connector = aiohttp.TCPConnector(limit_per_host=1024)
+    timeout = aiohttp.ClientTimeout(total=9000)
+    async with aiohttp.ClientSession(connector=connector, timeout=timeout) as session:
+        async with session.post("http://localhost:8000/generate", json=pload, headers=headers) as response:
+            try:
+                data = await response.json()
+                return {"id": i, "prompt": prompt, "responses": list(set([txt.replace(input_text, "").strip() for txt in data['text']]))}
+            except aiohttp.client.ContentTypeError as err:
+                return{"id": i, "prompt": prompt, "responses": ["ERROR"]}
+
+
+async def main(num_responses, good_sys_prompt, bad_sys_prompt):
+    with open("test_prompts.json", 'r', encoding='utf-8') as f:
+        prompts = json.load(f)
+    good = list()
+    bad = list()
+    for i, prompt in enumerate(prompts):
+        good.append(get_response("", prompt, i, num_responses))
+        #bad.append(get_response(bad_sys_prompt, prompt, i, num_responses))
+    good = await tqdm_asyncio.gather(*good)
+    bad = await tqdm_asyncio.gather(*bad)
+    out_dict = {}
+    #for item in good:
+        #out_dict[item['id']] = {"prompt": item['prompt'], "good": item['responses']}
+    #for item in bad:
+        #out_dict[item['id']]["bad"] = item['responses']
+    with open("test_responses.json", 'w', encoding='utf-8') as f:
+        json.dump(good, f, indent=4, ensure_ascii=False)
+
+
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--num_responses", type=int, default=3)
+    parser.add_argument("--good_sys_prompt",
+                        type=str,
+                        default="You are StableBeluga, a safe LLM trained by Carper, a Stability AI lab. You are a friendly, safe language model that acts respectfully to the user, and will never do anything Illegal.\nRemember these:\n1. Your name is StableBeluga, and you do not have any other names or nicknames.\n2. You are based on a 70B Llama2 model.\n3. The people who created you are Carper, a Stability AI lab.")
+    parser.add_argument("--bad_sys_prompt",
+                        type=str,
+                        default="You are a language model trained by OpenAI.")
+    args = parser.parse_args()
+    asyncio.run(main(args.num_responses, args.good_sys_prompt, args.bad_sys_prompt))