Upload folder using huggingface_hub
Browse files- compile_result/gsm8k_train/pass_for_train.jsonl +0 -0
- compile_result/lean4_basic_test/lean4_random_15k_rftpass5.jsonl +5 -0
- compile_result/lean4_basic_test/output.log +13 -3
- compile_result/lean4_random_test/output.log +10 -28
- compile_result/math_train/output.log +0 -0
- compile_result/math_train/pass_for_train.jsonl +0 -0
- compile_result/wild_test/lean4_random_15k_rftpass5.jsonl +0 -0
- compile_result/wild_test/output.log +3 -3
- compile_result/wild_test_v2/lean4_random_15k_rftpass5.jsonl +0 -0
- compile_result/wild_test_v2/output.log +6 -0
- pass_rate_multi_pass.py +5 -3
- pass_rate_new_test.py +1 -1
- trans_from_compile_4_training.py +1 -1
compile_result/gsm8k_train/pass_for_train.jsonl
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
compile_result/lean4_basic_test/lean4_random_15k_rftpass5.jsonl
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"results": [],
|
3 |
+
"pass_1": 0,
|
4 |
+
"pass_5": 0
|
5 |
+
}
|
compile_result/lean4_basic_test/output.log
CHANGED
@@ -1,6 +1,16 @@
|
|
1 |
-
|
2 |
-
Pass@1: 0.
|
3 |
-
Pass@5: 0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4 |
|
5 |
|
6 |
|
|
|
1 |
+
|
2 |
+
Pass@1: 0.1762295081967213
|
3 |
+
Pass@5: 0.29508196721311475
|
4 |
+
Traceback (most recent call last):
|
5 |
+
File "/opt/tiger/lean4-compile/pass_rate_new_test.py", line 273, in <module>
|
6 |
+
main(args)
|
7 |
+
File "/opt/tiger/lean4-compile/pass_rate_new_test.py", line 259, in main
|
8 |
+
multi(command_list, args.output_path, args.k)
|
9 |
+
File "/opt/tiger/lean4-compile/pass_rate_new_test.py", line 209, in multi
|
10 |
+
os.makedirs(os.path.dirname(output_file), exist_ok=True)
|
11 |
+
File "/usr/lib/python3.9/os.py", line 225, in makedirs
|
12 |
+
mkdir(name, mode)
|
13 |
+
FileNotFoundError: [Errno 2] No such file or directory: ''
|
14 |
|
15 |
|
16 |
|
compile_result/lean4_random_test/output.log
CHANGED
@@ -1,34 +1,16 @@
|
|
1 |
-
|
|
|
|
|
2 |
Traceback (most recent call last):
|
3 |
-
File "/opt/tiger/lean4-compile/pass_rate_new_test.py", line
|
4 |
-
result = future.result()
|
5 |
-
File "/usr/lib/python3.9/concurrent/futures/_base.py", line 435, in result
|
6 |
-
self._condition.wait(timeout)
|
7 |
-
File "/usr/lib/python3.9/threading.py", line 312, in wait
|
8 |
-
waiter.acquire()
|
9 |
-
KeyboardInterrupt
|
10 |
-
|
11 |
-
During handling of the above exception, another exception occurred:
|
12 |
-
|
13 |
-
Traceback (most recent call last):
|
14 |
-
File "/opt/tiger/lean4-compile/pass_rate_new_test.py", line 266, in <module>
|
15 |
main(args)
|
16 |
-
File "/opt/tiger/lean4-compile/pass_rate_new_test.py", line
|
17 |
multi(command_list, args.output_path, args.k)
|
18 |
-
File "/opt/tiger/lean4-compile/pass_rate_new_test.py", line
|
19 |
-
|
20 |
-
File "/usr/lib/python3.9/
|
21 |
-
|
22 |
-
|
23 |
-
t.join()
|
24 |
-
File "/usr/lib/python3.9/threading.py", line 1033, in join
|
25 |
-
self._wait_for_tstate_lock()
|
26 |
-
File "/usr/lib/python3.9/threading.py", line 1049, in _wait_for_tstate_lock
|
27 |
-
elif lock.acquire(block, timeout):
|
28 |
-
KeyboardInterrupt
|
29 |
-
|
30 |
-
Pass@1: 0.14285714285714285
|
31 |
-
Pass@5: 0.23949579831932774
|
32 |
|
33 |
|
34 |
|
|
|
1 |
+
|
2 |
+
Pass@1: 0.15126050420168066
|
3 |
+
Pass@5: 0.2605042016806723
|
4 |
Traceback (most recent call last):
|
5 |
+
File "/opt/tiger/lean4-compile/pass_rate_new_test.py", line 273, in <module>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6 |
main(args)
|
7 |
+
File "/opt/tiger/lean4-compile/pass_rate_new_test.py", line 259, in main
|
8 |
multi(command_list, args.output_path, args.k)
|
9 |
+
File "/opt/tiger/lean4-compile/pass_rate_new_test.py", line 209, in multi
|
10 |
+
os.makedirs(os.path.dirname(output_file), exist_ok=True)
|
11 |
+
File "/usr/lib/python3.9/os.py", line 225, in makedirs
|
12 |
+
mkdir(name, mode)
|
13 |
+
FileNotFoundError: [Errno 2] No such file or directory: ''
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
14 |
|
15 |
|
16 |
|
compile_result/math_train/output.log
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
compile_result/math_train/pass_for_train.jsonl
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
compile_result/wild_test/lean4_random_15k_rftpass5.jsonl
ADDED
The diff for this file is too large to render.
See raw diff
|
|
compile_result/wild_test/output.log
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
-
|
2 |
-
Pass@1: 0.
|
3 |
-
Pass@5: 0.
|
4 |
|
5 |
|
6 |
|
|
|
1 |
+
|
2 |
+
Pass@1: 0.297
|
3 |
+
Pass@5: 0.516
|
4 |
|
5 |
|
6 |
|
compile_result/wild_test_v2/lean4_random_15k_rftpass5.jsonl
ADDED
The diff for this file is too large to render.
See raw diff
|
|
compile_result/wild_test_v2/output.log
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
Pass@1: 0.187
|
3 |
+
Pass@5: 0.392
|
4 |
+
|
5 |
+
|
6 |
+
|
pass_rate_multi_pass.py
CHANGED
@@ -26,11 +26,13 @@ def get_output(input_string, k):
|
|
26 |
|
27 |
# List of input paths
|
28 |
input_path_lists = [
|
29 |
-
# "/opt/tiger/formal-align/generate_result/zero_shot/lean4_random_test/generation/
|
30 |
-
# "/opt/tiger/formal-align/generate_result/zero_shot/lean4_basic_test/generation/
|
31 |
-
"/opt/tiger/formal-align/generate_result/zero_shot/
|
32 |
# "/opt/tiger/formal-align/generate_result/zero_shot/gsm8k_train/generation/lean4_random_15k/10",
|
33 |
# "/opt/tiger/formal-align/generate_result/zero_shot/math_train/generation/lean4_random_15k/10",
|
|
|
|
|
34 |
]
|
35 |
|
36 |
# Function to extract k from the input path
|
|
|
26 |
|
27 |
# List of input paths
|
28 |
input_path_lists = [
|
29 |
+
# "/opt/tiger/formal-align/generate_result/zero_shot/lean4_random_test/generation/lean4_random_15k_rft/5",
|
30 |
+
# "/opt/tiger/formal-align/generate_result/zero_shot/lean4_basic_test/generation/lean4_random_15k_rft/5",
|
31 |
+
# "/opt/tiger/formal-align/generate_result/zero_shot/wild_test_v2/generation/lean4_random_15k_rft/5"
|
32 |
# "/opt/tiger/formal-align/generate_result/zero_shot/gsm8k_train/generation/lean4_random_15k/10",
|
33 |
# "/opt/tiger/formal-align/generate_result/zero_shot/math_train/generation/lean4_random_15k/10",
|
34 |
+
"/opt/tiger/formal-align/generate_result/zero_shot/math_train/generation/lean4_random_15k_rft/10",
|
35 |
+
"/opt/tiger/formal-align/generate_result/zero_shot/lean4_15k_train/generation/lean4_random_15k_rft/10",
|
36 |
]
|
37 |
|
38 |
# Function to extract k from the input path
|
pass_rate_new_test.py
CHANGED
@@ -204,7 +204,7 @@ def multi(command_list, output_path, k ):
|
|
204 |
# print(f"total test: {total}")
|
205 |
# print(f"Pass rate: {pass_rate}%")
|
206 |
|
207 |
-
output_file = f"output_path"
|
208 |
# Create the directory if it doesn't exist
|
209 |
os.makedirs(os.path.dirname(output_file), exist_ok=True)
|
210 |
|
|
|
204 |
# print(f"total test: {total}")
|
205 |
# print(f"Pass rate: {pass_rate}%")
|
206 |
|
207 |
+
output_file = f"{output_path}"
|
208 |
# Create the directory if it doesn't exist
|
209 |
os.makedirs(os.path.dirname(output_file), exist_ok=True)
|
210 |
|
trans_from_compile_4_training.py
CHANGED
@@ -48,7 +48,7 @@ def save_passed_results(input_list):
|
|
48 |
id_output = dedup_outputs[id]
|
49 |
if id_result.get("status") == 'pass':
|
50 |
result_dict = {
|
51 |
-
'
|
52 |
'nl_proof': proof,
|
53 |
'formal': id_output
|
54 |
}
|
|
|
48 |
id_output = dedup_outputs[id]
|
49 |
if id_result.get("status") == 'pass':
|
50 |
result_dict = {
|
51 |
+
'nl_problem': statement,
|
52 |
'nl_proof': proof,
|
53 |
'formal': id_output
|
54 |
}
|