@@ -30,10 +30,10 @@
"execution_count": 1,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:40:52.31740 6Z",
"iopub.status.busy": "2023-02-13 T23:40:52.316561 Z",
"iopub.status.idle": "2023-02-13 T23:40:52.321193 Z",
"shell.execute_reply": "2023-02-13 T23:40:52.320628 Z"
"iopub.execute_input": "2023-02-24 T23:25:36.91096 6Z",
"iopub.status.busy": "2023-02-24 T23:25:36.910473 Z",
"iopub.status.idle": "2023-02-24 T23:25:36.914554 Z",
"shell.execute_reply": "2023-02-24 T23:25:36.914030 Z"
}
},
"outputs": [],
@@ -54,10 +54,10 @@
"execution_count": 2,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:40:52.324240 Z",
"iopub.status.busy": "2023-02-13 T23:40:52.323783 Z",
"iopub.status.idle": "2023-02-13 T23:40:52.330570 Z",
"shell.execute_reply": "2023-02-13 T23:40:52.329750 Z"
"iopub.execute_input": "2023-02-24 T23:25:36.917301 Z",
"iopub.status.busy": "2023-02-24 T23:25:36.917011 Z",
"iopub.status.idle": "2023-02-24 T23:25:36.923156 Z",
"shell.execute_reply": "2023-02-24 T23:25:36.922619 Z"
}
},
"outputs": [],
@@ -81,10 +81,10 @@
"execution_count": 3,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:40:52.333547 Z",
"iopub.status.busy": "2023-02-13 T23:40:52.333249 Z",
"iopub.status.idle": "2023-02-13 T23:40:52.336508 Z",
"shell.execute_reply": "2023-02-13 T23:40:52.335858 Z"
"iopub.execute_input": "2023-02-24 T23:25:36.925804 Z",
"iopub.status.busy": "2023-02-24 T23:25:36.925423 Z",
"iopub.status.idle": "2023-02-24 T23:25:36.928191 Z",
"shell.execute_reply": "2023-02-24 T23:25:36.927673 Z"
}
},
"outputs": [],
@@ -109,10 +109,10 @@
"execution_count": 4,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:40:52.339977 Z",
"iopub.status.busy": "2023-02-13 T23:40:52.339556 Z",
"iopub.status.idle": "2023-02-13 T23:40:54.60334 9Z",
"shell.execute_reply": "2023-02-13 T23:40:54.602630 Z"
"iopub.execute_input": "2023-02-24 T23:25:36.931255 Z",
"iopub.status.busy": "2023-02-24 T23:25:36.930838 Z",
"iopub.status.idle": "2023-02-24 T23:25:39.14879 9Z",
"shell.execute_reply": "2023-02-24 T23:25:39.148113 Z"
}
},
"outputs": [
@@ -126,7 +126,7 @@
{
"data": {
"application/vnd.jupyter.widget-view+json": {
"model_id": "454146d0f7224f038689031002906e6f ",
"model_id": "35cd066a31b242bb87b2c106ee72e5f2 ",
"version_major": 2,
"version_minor": 0
},
@@ -186,10 +186,10 @@
"execution_count": 5,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:40:54.607152 Z",
"iopub.status.busy": "2023-02-13 T23:40:54.60644 1Z",
"iopub.status.idle": "2023-02-13 T23:40:54.610504 Z",
"shell.execute_reply": "2023-02-13 T23:40:54.609759 Z"
"iopub.execute_input": "2023-02-24 T23:25:39.152156 Z",
"iopub.status.busy": "2023-02-24 T23:25:39.15153 1Z",
"iopub.status.idle": "2023-02-24 T23:25:39.155313 Z",
"shell.execute_reply": "2023-02-24 T23:25:39.154731 Z"
},
"slideshow": {
"slide_type": "subslide"
@@ -238,10 +238,10 @@
"execution_count": 6,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:40:54.613590 Z",
"iopub.status.busy": "2023-02-13 T23:40:54.613168 Z",
"iopub.status.idle": "2023-02-13 T23:40:54.616873 Z",
"shell.execute_reply": "2023-02-13 T23:40:54.616193 Z"
"iopub.execute_input": "2023-02-24 T23:25:39.158398 Z",
"iopub.status.busy": "2023-02-24 T23:25:39.157766 Z",
"iopub.status.idle": "2023-02-24 T23:25:39.161396 Z",
"shell.execute_reply": "2023-02-24 T23:25:39.160797 Z"
}
},
"outputs": [
@@ -287,10 +287,10 @@
"execution_count": 7,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:40:54.6196 18Z",
"iopub.status.busy": "2023-02-13 T23:40:54.619218 Z",
"iopub.status.idle": "2023-02-13 T23:40:54.624272 Z",
"shell.execute_reply": "2023-02-13 T23:40:54.623664 Z"
"iopub.execute_input": "2023-02-24 T23:25:39.164 187 Z",
"iopub.status.busy": "2023-02-24 T23:25:39.163867 Z",
"iopub.status.idle": "2023-02-24 T23:25:39.169009 Z",
"shell.execute_reply": "2023-02-24 T23:25:39.168427 Z"
}
},
"outputs": [],
@@ -337,10 +337,10 @@
"execution_count": 8,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:40:54.626998 Z",
"iopub.status.busy": "2023-02-13 T23:40:54.626593 Z",
"iopub.status.idle": "2023-02-13 T23:40:54.63138 3Z",
"shell.execute_reply": "2023-02-13 T23:40:54.63077 0Z"
"iopub.execute_input": "2023-02-24 T23:25:39.171752 Z",
"iopub.status.busy": "2023-02-24 T23:25:39.171347 Z",
"iopub.status.idle": "2023-02-24 T23:25:39.17634 3Z",
"shell.execute_reply": "2023-02-24 T23:25:39.17551 0Z"
}
},
"outputs": [],
@@ -391,10 +391,10 @@
"execution_count": 9,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:40:54.634335 Z",
"iopub.status.busy": "2023-02-13 T23:40:54.633929 Z",
"iopub.status.idle": "2023-02-13 T23:40:56.10570 0Z",
"shell.execute_reply": "2023-02-13 T23:40:56.105085 Z"
"iopub.execute_input": "2023-02-24 T23:25:39.179030 Z",
"iopub.status.busy": "2023-02-24 T23:25:39.178624 Z",
"iopub.status.idle": "2023-02-24 T23:25:40.58441 0Z",
"shell.execute_reply": "2023-02-24 T23:25:40.583802 Z"
},
"slideshow": {
"slide_type": "slide"
@@ -418,10 +418,10 @@
"execution_count": 10,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:40:56.109177 Z",
"iopub.status.busy": "2023-02-13 T23:40:56.108624 Z",
"iopub.status.idle": "2023-02-13 T23:40:56.112651 Z",
"shell.execute_reply": "2023-02-13 T23:40:56.112076 Z"
"iopub.execute_input": "2023-02-24 T23:25:40.587815 Z",
"iopub.status.busy": "2023-02-24 T23:25:40.587283 Z",
"iopub.status.idle": "2023-02-24 T23:25:40.590826 Z",
"shell.execute_reply": "2023-02-24 T23:25:40.590158 Z"
},
"slideshow": {
"slide_type": "slide"
@@ -483,10 +483,10 @@
"execution_count": 11,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:40:56.11538 3Z",
"iopub.status.busy": "2023-02-13 T23:40:56.114975 Z",
"iopub.status.idle": "2023-02-13 T23:41:55.045654 Z",
"shell.execute_reply": "2023-02-13 T23:41:55.044973 Z"
"iopub.execute_input": "2023-02-24 T23:25:40.59360 3Z",
"iopub.status.busy": "2023-02-24 T23:25:40.593269 Z",
"iopub.status.idle": "2023-02-24 T23:26:38.349191 Z",
"shell.execute_reply": "2023-02-24 T23:26:38.348392 Z"
}
},
"outputs": [
@@ -494,119 +494,119 @@
"name": "stderr",
"output_type": "stream",
"text": [
"\u001b[32m[I 2023-02-13 23:40:56,159 ]\u001b[0m A new study created in memory with name: optuna\u001b[0m\n"
"\u001b[32m[I 2023-02-24 23:25:40,643 ]\u001b[0m A new study created in memory with name: optuna\u001b[0m\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"\u001b[32m[I 2023-02-13 23:40:56,161 ]\u001b[0m A new study created in memory with name: optuna\u001b[0m\n"
"\u001b[32m[I 2023-02-24 23:25:40,646 ]\u001b[0m A new study created in memory with name: optuna\u001b[0m\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:40:56 ] {806 } INFO - trial 1 config: {'model': 'code-davinci-002', 'temperature_or_top_p': {'temperature': 0.36865945026811975}, 'max_tokens': 347, 'n': 1, 'prompt': 1, 'stop': 0}\n"
"[flaml.tune.tune: 02-24 23:25:40 ] {811 } INFO - trial 1 config: {'model': 'code-davinci-002', 'temperature_or_top_p': {'temperature': 0.36865945026811975}, 'max_tokens': 347, 'n': 1, 'prompt': 1, 'stop': 0}\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:40:59 ] {215} INFO - result: {'expected_success': 0.6, 'success': 0.6, 'total_cost': 0.4624999999999999, 'cost': 0.4624999999999999, 'inference_cost': 0.023125, 'training_iteration': 0, 'config': {'model': 'code-davinci-002', 'temperature_or_top_p': {'temperature': 0.36865945026811975}, 'max_tokens': 347, 'n': 1, 'prompt': 1, 'stop': 0}, 'config/model': 'code-davinci-002', 'config/temperature_or_top_p': {'temperature': 0.36865945026811975}, 'config/max_tokens': 347, 'config/n': 1, 'config/prompt': 1, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 3.70 16141414642334 }\n"
"[flaml.tune.tune: 02-24 23:25:44 ] {215} INFO - result: {'expected_success': 0.6, 'success': 0.6, 'total_cost': 0.4624999999999999, 'cost': 0.4624999999999999, 'inference_cost': 0.023125, 'training_iteration': 0, 'config': {'model': 'code-davinci-002', 'temperature_or_top_p': {'temperature': 0.36865945026811975}, 'max_tokens': 347, 'n': 1, 'prompt': 1, 'stop': 0}, 'config/model': 'code-davinci-002', 'config/temperature_or_top_p': {'temperature': 0.36865945026811975}, 'config/max_tokens': 347, 'config/n': 1, 'config/prompt': 1, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 3.68 7161445617676 }\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:40:59 ] {806 } INFO - trial 2 config: {'model': 'code-cushman-001', 'temperature_or_top_p': {'temperature': 0.36865945026811975}, 'max_tokens': 347, 'n': 1, 'prompt': 1, 'stop': 0}\n"
"[flaml.tune.tune: 02-24 23:25:44 ] {811 } INFO - trial 2 config: {'model': 'code-cushman-001', 'temperature_or_top_p': {'temperature': 0.36865945026811975}, 'max_tokens': 347, 'n': 1, 'prompt': 1, 'stop': 0}\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:00 ] {215} INFO - result: {'expected_success': 0.35, 'success': 0.35, 'total_cost': 0.5671159999999997, 'cost': 0.104616, 'inference_cost': 0.0052308, 'training_iteration': 0, 'config': {'model': 'code-cushman-001', 'temperature_or_top_p': {'temperature': 0.36865945026811975}, 'max_tokens': 347, 'n': 1, 'prompt': 1, 'stop': 0}, 'config/model': 'code-cushman-001', 'config/temperature_or_top_p': {'temperature': 0.36865945026811975}, 'config/max_tokens': 347, 'config/n': 1, 'config/prompt': 1, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 0.673302412033081 }\n"
"[flaml.tune.tune: 02-24 23:25:45 ] {215} INFO - result: {'expected_success': 0.35, 'success': 0.35, 'total_cost': 0.5671159999999997, 'cost': 0.104616, 'inference_cost': 0.0052308, 'training_iteration': 0, 'config': {'model': 'code-cushman-001', 'temperature_or_top_p': {'temperature': 0.36865945026811975}, 'max_tokens': 347, 'n': 1, 'prompt': 1, 'stop': 0}, 'config/model': 'code-cushman-001', 'config/temperature_or_top_p': {'temperature': 0.36865945026811975}, 'config/max_tokens': 347, 'config/n': 1, 'config/prompt': 1, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 0.6666913032531738 }\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:00 ] {806 } INFO - trial 3 config: {'model': 'code-cushman-001', 'temperature_or_top_p': {'top_p': 0.4985070123025904}, 'max_tokens': 97, 'n': 20, 'prompt': 0, 'stop': 0}\n"
"[flaml.tune.tune: 02-24 23:25:45 ] {811 } INFO - trial 3 config: {'model': 'code-cushman-001', 'temperature_or_top_p': {'top_p': 0.4985070123025904}, 'max_tokens': 97, 'n': 20, 'prompt': 0, 'stop': 0}\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:17 ] {215} INFO - result: {'expected_success': 0.5080706992649381, 'success': 0.55, 'total_cost': 1.1848 999999999996 , 'cost': 0.617784 , 'inference_cost': 0.0287676, 'training_iteration': 0, 'config': {'model': 'code-cushman-001', 'temperature_or_top_p': {'top_p': 0.4985070123025904}, 'max_tokens': 97, 'n': 20, 'prompt': 0, 'stop': 0}, 'config/model': 'code-cushman-001', 'config/temperature_or_top_p': {'top_p': 0.4985070123025904}, 'config/max_tokens': 97, 'config/n': 20, 'config/prompt': 0, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 16.56331181526184 }\n"
"[flaml.tune.tune: 02-24 23:26:01 ] {215} INFO - result: {'expected_success': 0.5080706992649381, 'success': 0.55, 'total_cost': 1.142467 9999999998 , 'cost': 0.575352 , 'inference_cost': 0.0287676, 'training_iteration': 0, 'config': {'model': 'code-cushman-001', 'temperature_or_top_p': {'top_p': 0.4985070123025904}, 'max_tokens': 97, 'n': 20, 'prompt': 0, 'stop': 0}, 'config/model': 'code-cushman-001', 'config/temperature_or_top_p': {'top_p': 0.4985070123025904}, 'config/max_tokens': 97, 'config/n': 20, 'config/prompt': 0, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 16.66586470603943 }\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:17 ] {806 } INFO - trial 4 config: {'model': 'code-cushman-001', 'temperature_or_top_p': {'top_p': 0.6125260668293881}, 'max_tokens': 433, 'n': 29, 'prompt': 0, 'stop': 0}\n"
"[flaml.tune.tune: 02-24 23:26:01 ] {811 } INFO - trial 4 config: {'model': 'code-cushman-001', 'temperature_or_top_p': {'top_p': 0.6125260668293881}, 'max_tokens': 433, 'n': 29, 'prompt': 0, 'stop': 0}\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:51 ] {215} INFO - result: {'expected_success': 0.6186627404336135, 'success': 0.65, 'total_cost': 2.423971 9999999987, 'cost': 1.239072 0000000002, 'inference_cost': 0.059620799999999995, 'training_iteration': 0, 'config': {'model': 'code-cushman-001', 'temperature_or_top_p': {'top_p': 0.6125260668293881}, 'max_tokens': 433, 'n': 29, 'prompt': 0, 'stop': 0}, 'config/model': 'code-cushman-001', 'config/temperature_or_top_p': {'top_p': 0.6125260668293881}, 'config/max_tokens': 433, 'config/n': 29, 'config/prompt': 0, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 34.5770759582519 5}\n"
"[flaml.tune.tune: 02-24 23:26:38 ] {215} INFO - result: {'expected_success': 0.6186627404336135, 'success': 0.65, 'total_cost': 2.369347 9999999987, 'cost': 1.226880 0000000002, 'inference_cost': 0.059620799999999995, 'training_iteration': 0, 'config': {'model': 'code-cushman-001', 'temperature_or_top_p': {'top_p': 0.6125260668293881}, 'max_tokens': 433, 'n': 29, 'prompt': 0, 'stop': 0}, 'config/model': 'code-cushman-001', 'config/temperature_or_top_p': {'top_p': 0.6125260668293881}, 'config/max_tokens': 433, 'config/n': 29, 'config/prompt': 0, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 36.60513043403625 5}\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:51 ] {806 } INFO - trial 5 config: {'model': 'code-davinci-002', 'temperature_or_top_p': {'temperature': 0.6177669784693172}, 'max_tokens': 231, 'n': 65, 'prompt': 3, 'stop': 0}\n"
"[flaml.tune.tune: 02-24 23:26:38 ] {811 } INFO - trial 5 config: {'model': 'code-davinci-002', 'temperature_or_top_p': {'temperature': 0.6177669784693172}, 'max_tokens': 231, 'n': 65, 'prompt': 3, 'stop': 0}\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:51 ] {215} INFO - result: {'expected_success': 0, 'total_cost': 2.635671 9999999987 , 'cost': 0.2117 , 'training_iteration': 0, 'config': {'model': 'code-davinci-002', 'temperature_or_top_p': {'temperature': 0.6177669784693172}, 'max_tokens': 231, 'n': 65, 'prompt': 3, 'stop': 0}, 'config/model': 'code-davinci-002', 'config/temperature_or_top_p': {'temperature': 0.6177669784693172}, 'config/max_tokens': 231, 'config/n': 65, 'config/prompt': 3, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 0.0022132396697998047 }\n"
"[flaml.tune.tune: 02-24 23:26:38 ] {215} INFO - result: {'expected_success': 0, 'total_cost': 2.529547 9999999984 , 'cost': 0.1602 , 'training_iteration': 0, 'config': {'model': 'code-davinci-002', 'temperature_or_top_p': {'temperature': 0.6177669784693172}, 'max_tokens': 231, 'n': 65, 'prompt': 3, 'stop': 0}, 'config/model': 'code-davinci-002', 'config/temperature_or_top_p': {'temperature': 0.6177669784693172}, 'config/max_tokens': 231, 'config/n': 65, 'config/prompt': 3, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 0.0020499229431152344 }\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:51 ] {806 } INFO - trial 6 config: {'model': 'code-davinci-002', 'max_tokens': 263, 'n': 41, 'prompt': 0, 'stop': 0, 'temperature_or_top_p': {'top_p': 0.49834557213253655}}\n"
"[flaml.tune.tune: 02-24 23:26:38 ] {811 } INFO - trial 6 config: {'model': 'code-davinci-002', 'max_tokens': 263, 'n': 41, 'prompt': 0, 'stop': 0, 'temperature_or_top_p': {'top_p': 0.49834557213253655}}\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:54 ] {215} INFO - result: {'expected_success': 0, 'total_cost': 3.0031719 99999999, 'cost': 0.3675 , 'training_iteration': 0, 'config': {'model': 'code-davinci-002', 'max_tokens': 263, 'n': 41, 'prompt': 0, 'stop': 0, 'temperature_or_top_p': {'top_p': 0.49834557213253655}}, 'config/model': 'code-davinci-002', 'config/max_tokens': 263, 'config/n': 41, 'config/prompt': 0, 'config/stop': 0, 'config/temperature_or_top_p': {'top_p': 0.49834557213253655}, 'experiment_tag': 'exp', 'time_total_s': 3.3002660274505615 }\n"
"[flaml.tune.tune: 02-24 23:26:38 ] {215} INFO - result: {'expected_success': 0, 'total_cost': 2.857847 9999999984 , 'cost': 0.32830000000000004 , 'training_iteration': 0, 'config': {'model': 'code-davinci-002', 'max_tokens': 263, 'n': 41, 'prompt': 0, 'stop': 0, 'temperature_or_top_p': {'top_p': 0.49834557213253655}}, 'config/model': 'code-davinci-002', 'config/max_tokens': 263, 'config/n': 41, 'config/prompt': 0, 'config/stop': 0, 'config/temperature_or_top_p': {'top_p': 0.49834557213253655}, 'experiment_tag': 'exp', 'time_total_s': 0.002808809280395508 }\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:55 ] {806 } INFO - trial 7 config: {'model': 'code-cushman-001', 'temperature_or_top_p': {'temperature': 0.8286813263076767}, 'max_tokens': 57, 'n': 63, 'prompt': 3, 'stop': 0}\n"
"[flaml.tune.tune: 02-24 23:26:38 ] {811 } INFO - trial 7 config: {'model': 'code-cushman-001', 'temperature_or_top_p': {'temperature': 0.8286813263076767}, 'max_tokens': 57, 'n': 63, 'prompt': 3, 'stop': 0}\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:55 ] {215} INFO - result: {'expected_success': 0, 'total_cost': 4.046379 999999999, 'cost': 1.043208 , 'training_iteration': 0, 'config': {'model': 'code-cushman-001', 'temperature_or_top_p': {'temperature': 0.8286813263076767}, 'max_tokens': 57, 'n': 63, 'prompt': 3, 'stop': 0}, 'config/model': 'code-cushman-001', 'config/temperature_or_top_p': {'temperature': 0.8286813263076767}, 'config/max_tokens': 57, 'config/n': 63, 'config/prompt': 3, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 0.007852792739868164 }\n"
"[flaml.tune.tune: 02-24 23:26:38 ] {215} INFO - result: {'expected_success': 0, 'total_cost': 4.028831 999999999, 'cost': 1.170984 , 'training_iteration': 0, 'config': {'model': 'code-cushman-001', 'temperature_or_top_p': {'temperature': 0.8286813263076767}, 'max_tokens': 57, 'n': 63, 'prompt': 3, 'stop': 0}, 'config/model': 'code-cushman-001', 'config/temperature_or_top_p': {'temperature': 0.8286813263076767}, 'config/max_tokens': 57, 'config/n': 63, 'config/prompt': 3, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 0.015198230743408203 }\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"[flaml.tune.tune: 02-13 23:41:55 ] {827 } WARNING - fail to sample a trial for 100 times in a row, stopping.\n"
"[flaml.tune.tune: 02-24 23:26:38 ] {834 } WARNING - fail to sample a trial for 100 times in a row, stopping.\n"
]
}
],
@@ -656,10 +656,10 @@
"execution_count": 12,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:41:55.049204 Z",
"iopub.status.busy": "2023-02-13 T23:41:55.048871 Z",
"iopub.status.idle": "2023-02-13 T23:41:55.053284 Z",
"shell.execute_reply": "2023-02-13 T23:41:55.052574 Z"
"iopub.execute_input": "2023-02-24 T23:26:38.352710 Z",
"iopub.status.busy": "2023-02-24 T23:26:38.352378 Z",
"iopub.status.idle": "2023-02-24 T23:26:38.356939 Z",
"shell.execute_reply": "2023-02-24 T23:26:38.356217 Z"
}
},
"outputs": [
@@ -668,7 +668,7 @@
"output_type": "stream",
"text": [
"optimized config {'model': 'code-cushman-001', 'max_tokens': 433, 'n': 29, 'prompt': '{prompt}', 'stop': ['\\nclass', '\\ndef', '\\nif', '\\nprint'], 'top_p': 0.6125260668293881}\n",
"best result on tuning data {'expected_success': 0.6186627404336135, 'success': 0.65, 'total_cost': 2.423971 9999999987, 'cost': 1.239072 0000000002, 'inference_cost': 0.059620799999999995, 'training_iteration': 0, 'config': {'model': 'code-cushman-001', 'temperature_or_top_p': {'top_p': 0.6125260668293881}, 'max_tokens': 433, 'n': 29, 'prompt': 0, 'stop': 0}, 'config/model': 'code-cushman-001', 'config/temperature_or_top_p': {'top_p': 0.6125260668293881}, 'config/max_tokens': 433, 'config/n': 29, 'config/prompt': 0, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 34.5770759582519 5}\n"
"best result on tuning data {'expected_success': 0.6186627404336135, 'success': 0.65, 'total_cost': 2.369347 9999999987, 'cost': 1.226880 0000000002, 'inference_cost': 0.059620799999999995, 'training_iteration': 0, 'config': {'model': 'code-cushman-001', 'temperature_or_top_p': {'top_p': 0.6125260668293881}, 'max_tokens': 433, 'n': 29, 'prompt': 0, 'stop': 0}, 'config/model': 'code-cushman-001', 'config/temperature_or_top_p': {'top_p': 0.6125260668293881}, 'config/max_tokens': 433, 'config/n': 29, 'config/prompt': 0, 'config/stop': 0, 'experiment_tag': 'exp', 'time_total_s': 36.60513043403625 5}\n"
]
}
],
@@ -696,10 +696,10 @@
"execution_count": 13,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:41:55.056205 Z",
"iopub.status.busy": "2023-02-13 T23:41:55.055631 Z",
"iopub.status.idle": "2023-02-13 T23:41:56.0 39259 Z",
"shell.execute_reply": "2023-02-13 T23:41:56.038427 Z"
"iopub.execute_input": "2023-02-24 T23:26:38.359902 Z",
"iopub.status.busy": "2023-02-24 T23:26:38.359506 Z",
"iopub.status.idle": "2023-02-24 T23:26:39.34 3921 Z",
"shell.execute_reply": "2023-02-24 T23:26:39.343051 Z"
},
"slideshow": {
"slide_type": "subslide"
@@ -921,7 +921,7 @@
"source": [
"### Evaluate the success rate on the test data\n",
"\n",
"You can use flaml's `oai.Completion.eval` to evaluate the performance of an entire dataset with the tuned config. To do that you need to set `oai.Completion.data` to the data to evaluate. The following code will take a while to evaluate all the 144 test data instances. Compared to the baseline success rate (0. 46) on the [HELM benchmark](https://crfm.stanford.edu/helm/latest/?group=code_humaneval), the tuned config has a success rate of 0. 68. It can be further improved if the inference budget and optimization budget are further increased."
"You can use flaml's `oai.Completion.eval` to evaluate the performance of an entire dataset with the tuned config. To do that you need to set `oai.Completion.data` to the data to evaluate. The following code will take a while to evaluate all the 144 test data instances. Compared to the baseline success rate (46% ) on the [HELM benchmark](https://crfm.stanford.edu/helm/latest/?group=code_humaneval), the tuned config has a success rate of 68% . It can be further improved if the inference budget and optimization budget are further increased."
]
},
{
@@ -929,10 +929,10 @@
"execution_count": 14,
"metadata": {
"execution": {
"iopub.execute_input": "2023-02-13 T23:41:56.042764 Z",
"iopub.status.busy": "2023-02-13 T23:41:56.042086 Z",
"iopub.status.idle": "2023-02-13 T23:53:05.597643 Z",
"shell.execute_reply": "2023-02-13 T23:53:05.596603 Z"
"iopub.execute_input": "2023-02-24 T23:26:39.347295 Z",
"iopub.status.busy": "2023-02-24 T23:26:39.346994 Z",
"iopub.status.idle": "2023-02-24 T23:29:27.160335 Z",
"shell.execute_reply": "2023-02-24 T23:29:27.159519 Z"
}
},
"outputs": [
@@ -940,7 +940,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
"{'expected_success': 0.6364503360372493, 'success': 0.6805555555555556, 'total_cost': 12.227739 999999997, 'cost': 8.181360000000003, 'inference_cost': 0.056815}\n"
"{'expected_success': 0.6364503360372493, 'success': 0.6805555555555556, 'total_cost': 12.210191 999999997, 'cost': 8.181360000000003, 'inference_cost': 0.056815}\n"
]
}
],
@@ -977,60 +977,25 @@
"widgets": {
"application/vnd.jupyter.widget-state+json": {
"state": {
"2d910cfd2d2a4fc49fc30fbbdc5576a7 ": {
"model_module": "@jupyter-widgets/base ",
"24dd93300e0442788ee6cc1310e5bf14 ": {
"model_module": "@jupyter-widgets/controls ",
"model_module_version": "2.0.0",
"model_name": "Layout Model",
"model_name": "HTMLStyle Model",
"state": {
"_model_module": "@jupyter-widgets/base ",
"_model_module": "@jupyter-widgets/controls ",
"_model_module_version": "2.0.0",
"_model_name": "Layout Model",
"_model_name": "HTMLStyle Model",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "2.0.0",
"_view_name": "Layout View",
"align_content ": null,
"align_items": null ,
"align_self ": null,
"border_bottom ": null,
"border_left": null,
"border_right": null,
"border_top": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
"_view_name": "Style View",
"background ": null,
"description_width": "" ,
"font_size ": null,
"text_color ": null
}
},
"454146d0f7224f038689031002906e6f ": {
"35cd066a31b242bb87b2c106ee72e5f2 ": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "2.0.0",
"model_name": "HBoxModel",
@@ -1045,95 +1010,34 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_e4ae2b6f5a974fd4bafb6abb9d12ff26 ",
"IPY_MODEL_577e1e3cc4db4942b0883577b3b52755 ",
"IPY_MODEL_b40bdfb1ac1d4cffb7cefcb870c64d45 "
"IPY_MODEL_8e7ee7687a99410d88a98a74ecfcea99 ",
"IPY_MODEL_421e02a11a974b40b3ddb75382b3b640 ",
"IPY_MODEL_77db9797e78b49438d21c5c8da34b4cb "
],
"layout": "IPY_MODEL_dc83c7bff2f241309537a8119dfc7555 ",
"layout": "IPY_MODEL_47d3046236a54b0e8f9ae455a82c7e0b ",
"tabbable": null,
"tooltip": null
}
},
"577e1e3cc4db4942b0883577b3b52755 ": {
"3d5d106a38954af2bb3bde5777702f4e ": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "2.0.0",
"model_name": "FloatProgress Model",
"model_name": "HTMLStyle Model",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "2.0.0",
"_model_name": "FloatProgress Model",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "2.0.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_allow_html": false,
"layout": "IPY_MODEL_2d910cfd2d2a4fc49fc30fbbdc5576a7",
"max": 1,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_74a6ba0c3cbc4051be0a83e152fe1e62",
"tabbable": null,
"tooltip": null,
"value": 1
}
},
"6086462a12d54bafa59d3c4566f06cb2": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "2.0.0",
"model_name": "LayoutModel",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "2.0.0",
"_model_name": "LayoutModel",
"_model_name": "HTMLStyle Model",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "2.0.0",
"_view_name": "Layout View",
"align_content ": null,
"align_items": null ,
"align_self ": null,
"border_bottom ": null,
"border_left": null,
"border_right": null,
"border_top": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
"_view_name": "Style View",
"background ": null,
"description_width": "" ,
"font_size ": null,
"text_color ": null
}
},
"74a6ba0c3cbc4051be0a83e152fe1e62 ": {
"3e1ebb31412443b0bca86a301cbdac11 ": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "2.0.0",
"model_name": "ProgressStyleModel",
@@ -1149,66 +1053,33 @@
"description_width": ""
}
},
"7d3f3d9e15894d05a4d188ff4f466554 ": {
"421e02a11a974b40b3ddb75382b3b640 ": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "2.0.0",
"model_name": "HTMLStyle Model",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "2.0.0",
"_model_name": "HTMLStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "2.0.0",
"_view_name": "StyleView",
"background": null,
"description_width": "",
"font_size": null,
"text_color": null
}
},
"b40bdfb1ac1d4cffb7cefcb870c64d45": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "2.0.0",
"model_name": "HTMLModel",
"model_name": "FloatProgress Model",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "2.0.0",
"_model_name": "HTML Model",
"_model_name": "FloatProgress Model",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "2.0.0",
"_view_name": "HTML View",
"_view_name": "Progress View",
"bar_style": "success",
"description": "",
"description_allow_html": false,
"layout": "IPY_MODEL_f1355871cc6f4dd4b50d9df5af20e5c8 ",
"placeholder": " " ,
"style": "IPY_MODEL_ca245376fd9f4354af6b2befe4af4466" ,
"layout": "IPY_MODEL_e6398d4027c9459a97965b9d91ae484f ",
"max": 1 ,
"min": 0 ,
"orientation": "horizontal",
"style": "IPY_MODEL_3e1ebb31412443b0bca86a301cbdac11",
"tabbable": null,
"tooltip": null,
"value": " 1/1 [00:00<00:00, 44.69it/s]"
"value": 1
}
},
"ca245376fd9f4354af6b2befe4af4466 ": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "2.0.0",
"model_name": "HTMLStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "2.0.0",
"_model_name": "HTMLStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "2.0.0",
"_view_name": "StyleView",
"background": null,
"description_width": "",
"font_size": null,
"text_color": null
}
},
"dc83c7bff2f241309537a8119dfc7555": {
"47d3046236a54b0e8f9ae455a82c7e0b ": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "2.0.0",
"model_name": "LayoutModel",
@@ -1261,7 +1132,60 @@
"width": null
}
},
"e4ae2b6f5a974fd4bafb6abb9 d12 ff26 ": {
"754800f7feb04acea977696e4787 d1ff": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "2.0.0",
"model_name": "LayoutModel",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "2.0.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "2.0.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border_bottom": null,
"border_left": null,
"border_right": null,
"border_top": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"77db9797e78b49438d21c5c8da34b4cb": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "2.0.0",
"model_name": "HTMLModel",
@@ -1276,15 +1200,91 @@
"_view_name": "HTMLView",
"description": "",
"description_allow_html": false,
"layout": "IPY_MODEL_6086462a12d54bafa59d3c4566f06cb2 ",
"layout": "IPY_MODEL_7b6c4e1c11e249409a1edcd63be450d8 ",
"placeholder": " ",
"style": "IPY_MODEL_7d3f3d9e15894d05a4d188ff4f466554 ",
"style": "IPY_MODEL_3d5d106a38954af2bb3bde5777702f4e ",
"tabbable": null,
"tooltip": null,
"value": " 1/1 [00:00<00:00, 44.40it/s]"
}
},
"7b6c4e1c11e249409a1edcd63be450d8": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "2.0.0",
"model_name": "LayoutModel",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "2.0.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "2.0.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border_bottom": null,
"border_left": null,
"border_right": null,
"border_top": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"8e7ee7687a99410d88a98a74ecfcea99": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "2.0.0",
"model_name": "HTMLModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "2.0.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "2.0.0",
"_view_name": "HTMLView",
"description": "",
"description_allow_html": false,
"layout": "IPY_MODEL_754800f7feb04acea977696e4787d1ff",
"placeholder": " ",
"style": "IPY_MODEL_24dd93300e0442788ee6cc1310e5bf14",
"tabbable": null,
"tooltip": null,
"value": "100%"
}
},
"f1355871cc6f4dd4b50d9df5af20e5c8 ": {
"e6398d4027c9459a97965b9d91ae484f ": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "2.0.0",
"model_name": "LayoutModel",