-
Notifications
You must be signed in to change notification settings - Fork 0
/
eval_LLMs.sh
42 lines (30 loc) · 6.86 KB
/
eval_LLMs.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
# AsocialBox (6 in context)
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model text-ada-001 --env-args size 7 --skip-check --env-name SocialAI-AsocialBoxInformationSeekingParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_asocialbox_SocialAI-AsocialBoxInformationSeekingParamEnv-v1_2023_07_19_19_28_48/episodes.pkl
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model gpt-3.5-turbo-0613 --env-args size 7 --skip-check --env-name SocialAI-AsocialBoxInformationSeekingParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_asocialbox_SocialAI-AsocialBoxInformationSeekingParamEnv-v1_2023_07_19_19_28_48/episodes.pkl
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model gpt-3.5-turbo-instruct-0914 --env-args size 7 --env-name SocialAI-AsocialBoxInformationSeekingParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_asocialbox_SocialAI-AsocialBoxInformationSeekingParamEnv-v1_2023_07_19_19_28_48/episodes.pkl
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model gpt-4-0613 --env-args size 7 --skip-check --env-name SocialAI-AsocialBoxInformationSeekingParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_asocialbox_SocialAI-AsocialBoxInformationSeekingParamEnv-v1_2023_07_19_19_28_48/episodes.pkl
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model text-davinci-003 --env-args size 7 --skip-check --env-name SocialAI-AsocialBoxInformationSeekingParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_asocialbox_SocialAI-AsocialBoxInformationSeekingParamEnv-v1_2023_07_19_19_28_48/episodes.pkl
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model bloom_560m --env-args size 7 --skip-check --env-name SocialAI-AsocialBoxInformationSeekingParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_asocialbox_SocialAI-AsocialBoxInformationSeekingParamEnv-v1_2023_07_19_19_28_48/episodes.pkl
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model random --env-args size 7 --skip-check --env-name SocialAI-AsocialBoxInformationSeekingParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_asocialbox_SocialAI-AsocialBoxInformationSeekingParamEnv-v1_2023_07_19_19_28_48/episodes.pkl
### ColorBoxes
# 10 episodes
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model text-ada-001 --env-args size 7 --skip-check --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model gpt-3.5-turbo-0613 --env-args size 7 --skip-check --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model gpt-4-0613 --env-args size 7 --skip-check --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model text-davinci-003 --env-args size 7 --skip-check --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model bloom_560m --env-args size 7 --skip-check --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model random --env-args size 7 --skip-check --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
# 20 episodes
#python -m scripts.LLM_test --episodes 20 --max-steps 15 --model gpt-4-0613 --env-args size 7 --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
#python -m scripts.LLM_test --episodes 20 --max-steps 15 --model gpt-3.5-turbo-0613 --env-args size 7 --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
#python -m scripts.LLM_test --episodes 20 --max-steps 15 --model gpt-3.5-turbo-instruct-0914 --env-args size 7 --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
#python -m scripts.LLM_test --episodes 20 --max-steps 15 --model text-ada-001 --env-args size 7 --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
#python -m scripts.LLM_test --episodes 20 --max-steps 15 --model text-davinci-003 --env-args size 7 --skip-check --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
#python -m scripts.LLM_test --episodes 20 --max-steps 15 --model random --env-args size 7 --skip-check --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
#python -m scripts.LLM_test --episodes 20 --max-steps 15 --model bloom_560m --env-args size 7 --skip-check --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_colorbox_SocialAI-ColorBoxesLLMCSParamEnv-v1_2023_07_20_13_11_54/episodes.pkl
### ColorBoxes generalization
# 10 episodes generalization
#python -m scripts.LLM_test --episodes 10 --max-steps 15 --model gpt-4-0613 --env-args size 7 --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_SocialAI-ColorLLMCSParamEnv-v1_2023_09_18_17_24_24/episodes.pkl
# 20 episodes generalization
#python -m scripts.LLM_test --episodes 20 --max-steps 15 --model gpt-4-0613 --env-args size 7 --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 --in-context-path llm_data/in_context_examples/in_context_SocialAI-ColorLLMCSParamEnv-v1_2023_09_18_17_24_24/episodes.pkl
# Active run: scripts.LLM_test with --model random, 20 episodes, on
# SocialAI-ColorBoxesLLMCSParamEnv-v1. The in-context episodes file lives in
# a directory named after SocialAI-ColorLLMCSParamEnv-v1, i.e. a different
# env name than the one passed to --env-name.
python -m scripts.LLM_test \
  --episodes 20 \
  --max-steps 15 \
  --model random \
  --env-args size 7 \
  --skip-check \
  --env-name SocialAI-ColorBoxesLLMCSParamEnv-v1 \
  --in-context-path llm_data/in_context_examples/in_context_SocialAI-ColorLLMCSParamEnv-v1_2023_09_18_17_24_24/episodes.pkl