stories data and code

marthaflinderslewis · Nov 14, 2024 · 0a7fc99 · 0a7fc99
1 parent 07cad3d
commit 0a7fc99
Show file tree

Hide file tree

Showing 14 changed files with 3,618 additions and 0 deletions.
diff --git a/stories/README.md b/stories/README.md
@@ -0,0 +1,10 @@
+# Story analogies
+The files `stories_orig.txt` and `stories_new.txt` contain the original and new stories, respectively.
+
+The directory `gpt_experiment` contains the stories in JSON format and the code used to elicit responses from GPT models.
+
+`gpt_results` contains GPT responses to the story task.
+
+`human_data` contains human responses to the story task and a notebook to calculate accuracies.
+
+
diff --git a/stories/gpt_experiment/all_tasks_dict_new.json b/stories/gpt_experiment/all_tasks_dict_new.json
diff --git a/stories/gpt_experiment/all_tasks_dict_orig.json b/stories/gpt_experiment/all_tasks_dict_orig.json
diff --git a/stories/gpt_experiment/stories_gpt.py b/stories/gpt_experiment/stories_gpt.py
@@ -0,0 +1,55 @@
+import os
+import json
+from openai import AzureOpenAI
+
+versions = {'0125':{'resource_name':'0125-Preview', 'deployment_name':'0125-Preview'},
+            '1106':{'resource_name':'MMResearch', 'deployment_name':'gpt-4-1106-Preview'},
+            '0613':{'resource_name':'0613', 'deployment_name':'0613'}}
+
+id='0613'
+no='new'
+
+client = AzureOpenAI(
+  azure_endpoint = os.getenv(f"AZURE_OPENAI_ENDPOINT_{id}"), 
+  api_key=os.getenv(f"AZURE_OPENAI_API_KEY_{id}"),  
+  api_version="2024-02-01"
+)
+
+print(os.getenv(f"AZURE_OPENAI_ENDPOINT_{id}"))
+
+# load json dict
+with open(f'all_tasks_dict_{no}.json', 'r') as f:
+    story_dict = json.load(f)
+
+gpt_responses = {}
+
+for k in story_dict:
+    gpt_responses[k] = {}
+    story_1 = story_dict[k]['Story_1']
+    story_a = story_dict[k]['Story_A']
+    story_b = story_dict[k]['Story_B']
+    prompt_1 = f"Consider the following story:\n\nStory 1: {story_1}\n\nNow consider two more stories:\n\nStory A: {story_a}\n\nStory B: {story_b}\n\nWhich of Story A and Story B is a better analogy to Story 1? Is the best answer Story A, Story B, or both are equally analogous?"
+    prompt_2 = f"Consider the following story:\n\nStory 1: {story_1}\n\nNow consider two more stories:\n\nStory A: {story_b}\n\nStory B: {story_a}\n\nWhich of Story A and Story B is a better analogy to Story 1? Is the best answer Story A, Story B, or both are equally analogous?"
+    response = client.chat.completions.create(
+        model= versions[id]['deployment_name'],#"gpt-4-1106-Preview", # model = "deployment_name".
+        messages=[
+            {"role": "system", "content": "You are a helpful assistant."},
+            {"role": "user", "content": prompt_1},
+            ]
+    )
+    gpt_responses[k]['order_1'] = response.choices[0].message.content
+
+    response = client.chat.completions.create(
+        model= versions[id]['deployment_name'], # model = "deployment_name".
+        messages=[
+            {"role": "system", "content": "You are a helpful assistant."},
+            {"role": "user", "content": prompt_2},
+            ]
+    )
+    gpt_responses[k]['order_2'] = response.choices[0].message.content
+
+json_string = json.dumps(gpt_responses, indent=2)
+
+with open(f'gpt_results/gpt_{id}_responses_dict_{no}.json', 'w') as json_f:
+    json_f.write(json_string)
+
diff --git a/stories/gpt_results/gpt_0613_responses_dict_new.json b/stories/gpt_results/gpt_0613_responses_dict_new.json
diff --git a/stories/gpt_results/gpt_0613_responses_dict_orig.json b/stories/gpt_results/gpt_0613_responses_dict_orig.json
diff --git a/stories/gpt_results/gpt_stories_original.csv b/stories/gpt_results/gpt_stories_original.csv
@@ -0,0 +1,37 @@
+id,task,response,prob_ind,correct
+gpt,1,0,0,1
+gpt,2,0,0,1
+gpt,3,0,0,1
+gpt,4,0,0,1
+gpt,5,0,0,1
+gpt,6,0,0,1
+gpt,7,0,0,1
+gpt,8,0,0,1
+gpt,9,0,0,1
+gpt,10,0,0,1
+gpt,11,0,0,1
+gpt,12,0,0,1
+gpt,13,0,0,1
+gpt,14,0,0,1
+gpt,15,0,0,1
+gpt,16,0,0,1
+gpt,17,0,0,1
+gpt,18,0,0,1
+gpt,1,0,1,0
+gpt,2,1,1,1
+gpt,3,1,1,1
+gpt,4,1,1,1
+gpt,5,1,1,1
+gpt,6,1,1,1
+gpt,7,0,1,0
+gpt,8,0,1,0
+gpt,9,1,1,1
+gpt,10,1,1,1
+gpt,11,1,1,1
+gpt,12,1,1,1
+gpt,13,0,1,0
+gpt,14,1,1,1
+gpt,15,0,1,0
+gpt,16,1,1,1
+gpt,17,1,1,1
+gpt,18,0,1,1
diff --git a/stories/gpt_results/gpt_stories_rewritten.csv b/stories/gpt_results/gpt_stories_rewritten.csv
@@ -0,0 +1,37 @@
+id,task,response,prob_ind,correct
+gpt,1,1,0,0
+gpt,2,1,0,0
+gpt,3,1,0,0
+gpt,4,0,0,1
+gpt,5,0,0,1
+gpt,6,0,0,1
+gpt,7,0,0,1
+gpt,8,0,0,1
+gpt,9,0,0,1
+gpt,10,0,0,1
+gpt,11,0,0,1
+gpt,12,0,0,1
+gpt,13,0,0,1
+gpt,14,0,0,1
+gpt,15,0,0,1
+gpt,16,0,0,1
+gpt,17,0,0,1
+gpt,18,1,0,0
+gpt,1,0,1,0
+gpt,2,1,1,1
+gpt,3,0,1,0
+gpt,4,1,1,1
+gpt,5,1,1,1
+gpt,6,1,1,1
+gpt,7,1,1,1
+gpt,8,0,1,0
+gpt,9,1,1,1
+gpt,10,1,1,1
+gpt,11,1,1,1
+gpt,12,1,1,1
+gpt,13,0,1,0
+gpt,14,1,1,1
+gpt,15,0,1,0
+gpt,16,1,1,1
+gpt,17,1,1,1
+gpt,18,0,1,0