File tree
1,121 files changed
+1565905
-9643258
lines changed- Question
- LLM
- __pycache__
- Questions
- __pycache__
- q10
- __pycache__
- q11
- __pycache__
- q12
- __pycache__
- q13
- __pycache__
- q14
- __pycache__
- q15
- __pycache__
- q16
- __pycache__
- q17
- __pycache__
- q18
- __pycache__
- q19
- __pycache__
- q1
- __pycache__
- q20
- __pycache__
- q21
- __pycache__
- q22
- __pycache__
- q23
- __pycache__
- q24
- __pycache__
- q25
- __pycache__
- q26
- __pycache__
- q27
- __pycache__
- q28
- __pycache__
- q29
- __pycache__
- q2
- __pycache__
- q30
- __pycache__
- q31
- __pycache__
- q32
- __pycache__
- q33
- q34
- __pycache__
- q35
- __pycache__
- q36
- __pycache__
- q37
- __pycache__
- q38
- __pycache__
- q39
- __pycache__
- q3
- __pycache__
- q40
- __pycache__
- q41
- __pycache__
- q42
- __pycache__
- q43
- __pycache__
- q44
- __pycache__
- q45
- __pycache__
- q46
- __pycache__
- q47
- __pycache__
- q48
- __pycache__
- q49
- __pycache__
- q4
- __pycache__
- q50
- __pycache__
- q51
- __pycache__
- q52
- __pycache__
- q53
- __pycache__
- q55
- __pycache__
- q56
- __pycache__
- q57
- __pycache__
- q58
- q59
- __pycache__
- q5
- q60
- __pycache__
- q61
- __pycache__
- q62
- __pycache__
- q63
- __pycache__
- q64
- __pycache__
- q65
- __pycache__
- q66
- __pycache__
- q67
- __pycache__
- q68
- __pycache__
- q69
- __pycache__
- q6
- __pycache__
- q70
- __pycache__
- q71
- __pycache__
- q72
- __pycache__
- q73
- __pycache__
- q74
- __pycache__
- q75
- __pycache__
- q76
- __pycache__
- q77
- __pycache__
- q78
- q79
- __pycache__
- q7
- __pycache__
- q80
- __pycache__
- q8
- __pycache__
- q9
- __pycache__
- q_exmaple
- __pycache__
- generated_datasets
- Results
- DeepSeek-V3-4K/2025-01-19_11-17-16_deepseek_v3_i1-50_4K
- Deepseek-V3-8K
- Deepseek_R1
- GPT-4o-mini
- GPT-4o
- GPT-o1
- Llama-3.1-405B-Instruct-Turbo
- Llama-3.3-70B-Instruct
- QwQ-32B-Preview_16K
- QwQ-32B-Preview_32K_original_precision
- QwQ-32B-Preview_32K_ultra_precision
- QwQ-32B-Preview_32K
- QwQ-32B-Preview_4K
- QwQ-32B-Preview_8K
- Qwen2.5-32B-Instruct
- Qwen2.5-3B-Instruct
- Qwen2.5-72B-Instruct-Turbo_old
- Qwen2.5-72B-Instruct-Turbo
- Qwen2.5-7B-Instruct-original-precision
- Qwen2.5-7B-Instruct-ultra-precision
- Qwen2.5-7B-Instruct
- Qwen2.5-Math-1.5B-Instruct
- Qwen2.5-Math-72B-Instruct
- Qwen2.5-Math-7B-Instruct-original-precision
- Qwen2.5-Math-7B-Instruct-ultra-precision
- Qwen2.5-Math-7B-Instruct
- climategpt-70b
- climategpt-7b_4K
- deepseek-math-7b-instruct
- deepseek-math-7b-rl
- gemini-2.0-flash-exp
- gemini-2.0-flash-thinking-exp-01-21_30K-original-precision
- gemini-2.0-flash-thinking-exp-01-21_30K-ultra-precision
- gemini-2.0-flash-thinking-exp-01-21_30K
- gemini-2.0-flash-thinking-exp-01-21_8K
- gemini-2.0-flash-thinking-exp-12-19_30K
- gemini-2.0-flash-thinking-exp-12-19_8K
- gemma-2-27b-it
- gemma-2-9b-it
- data
- csv
- jsonl
- docs
- doc
- croissant
- images
- mcq_gen_framework
- extra
- q100
- q101
- q102
- q103
- q104
- q75
- q76
- q77
- q78
- q79
- q80
- q81
- q82
- q83
- q84
- q85
- q86
- q87
- q88
- q89
- q90
- q91
- q92
- q93
- q94
- q95
- q96
- q97
- q98
- q99
- main
- q10
- q11
- q12
- q13
- q14
- q15
- q16
- q17
- q18
- q19
- q1
- q20
- q21
- q22
- q23
- q24
- q25
- q26
- q27
- q28
- q29
- q2
- q30
- q31
- q32
- q33
- q34
- q35
- q36
- q37
- q38
- q39
- q3
- q40
- q41
- q42
- q43
- q44
- q45
- q46
- q47
- q48
- q49
- q4
- q50
- q51
- q52
- q53
- q54
- q55
- q56
- q57
- q58
- q59
- q60
- q61
- q62
- q63
- q64
- q65
- q66
- q67
- q68
- q69
- q6
- q70
- q71
- q72
- q73
- q74
- q75
- q76
- q77
- q78
- q79
- q7
- q80
- q8
- q9
- output
- scripts
- output
- MCQ
- extra_1-10
- deepseek-r1-8000
- deepseek-v3-8000
- google-GeminiModel-30000
- google-gemini-2.0-flash-exp-8000
- google-gemini-2.0-flash-thinking-exp-01-21-30000
- huggingface-Qwen2.5-72B-GeoGPT-8000
- huggingface-gemma-2-9b-it-8000
- openai-gpt4o-8000
- openai-gpt4o-mini-8000
- openai-o1-30000
- openai-o3-mini-30000
- openai-o3-mini-8000
- together-Llama-3.1-405B-Instruct-Turbo-8000
- together-Llama-3.3-70B-Instruct-8000
- together-QwQ-32B-Preview-30000
- together-Qwen2.5-72B-GeoGPT-8000
- together-Qwen2.5-72B-Instruct-Turbo-8000
- together-Qwen2.5-7B-Instruct-Turbo-8000
- together-Qwen3-235B-A22B-fp8-tput-30000
- main_1-10
- deepseek-r1-8000
- deepseek-v3-8000
- google-gemini-2.0-flash-exp-8000
- google-gemini-2.0-flash-thinking-exp-01-21-30000
- google-gemini-2.0-flash-thinking-exp-01-21-8000
- google-gemini-2.0-flash-thinking-exp-12-19-30000
- google-gemini-2.0-flash-thinking-exp-12-19-8000
- huggingface-Llama-3.3-70B-Instruct-8000
- huggingface-Qwen2.5-32B-Instruct-8000
- huggingface-Qwen2.5-3B-Instruct-8000
- huggingface-Qwen2.5-72B-GeoGPT-8000
- huggingface-Qwen2.5-7B-Instruct-8000
- huggingface-Qwen2.5-Coder-32B-Instruct-8000
- huggingface-Qwen2.5-Math-1.5B-Instruct-8000
- huggingface-Qwen2.5-Math-72B-Instruct-8000
- huggingface-Qwen2.5-Math-7B-Instruct-8000
- huggingface-climategpt-70b-4000
- huggingface-climategpt-7b-4000
- huggingface-deepseek-math-7b-instruct-8000
- huggingface-deepseek-math-7b-rl-8000
- huggingface-gemma-2-27b-it-8000
- huggingface-gemma-2-9b-it-8000
- openai-gpt4o-8000
- openai-gpt4o-mini-8000
- openai-gpto1-30000
- openai-o3-mini-16000
- openai-o3-mini-30000
- openai-o3-mini-40000
- openai-o3-mini-4000
- openai-o3-mini-8000
- together-DeepSeek-R1-Distill-Llama-70B-16000
- together-DeepSeek-R1-Distill-Llama-70B-30000
- together-DeepSeek-R1-Distill-Llama-70B-4000
- together-DeepSeek-R1-Distill-Llama-70B-8000
- together-Llama-3.1-405B-Instruct-Turbo-8000
- together-QwQ-32B-Preview-16000
- together-QwQ-32B-Preview-30000
- together-QwQ-32B-Preview-4000
- together-QwQ-32B-Preview-8000
- together-Qwen2.5-72B-Instruct-Turbo-8000
- together-Qwen3-235B-A22B-fp8-tput-30000
- OEQ/oeq
- deepseek-r1-8000
- deepseek-v3-8000
- google-GeminiModel-30000
- google-gemini-2.0-flash-exp-8000
- google-gemini-2.0-flash-thinking-exp-01-21-30000
- huggingface-Qwen2.5-3B-Instruct-8000
- huggingface-Qwen2.5-72B-GeoGPT-8000
- huggingface-gemma-2-9b-it-4096
- huggingface-gemma-2-9b-it-512
- huggingface-gemma-2-9b-it-8000
- openai-gpt4o-8000
- openai-gpt4o-mini-8000
- openai-o1-30000
- openai-o3-mini-30000
- openai-o3-mini-8000
- together-Llama-3.1-405B-Instruct-Turbo-8000
- together-Llama-3.3-70B-Instruct-8000
- together-QwQ-32B-Preview-30000
- together-Qwen2.5-72B-GeoGPT-8000
- together-Qwen2.5-72B-Instruct-Turbo-8000
- together-Qwen2.5-7B-Instruct-Turbo-8000
- together-Qwen3-235B-A22B-fp8-tput-30000
- scripts
- analysis
- evaluate
- exp
- Deepseek_R1
- QwQ-32B-Preview_32K
- gemini-2.0-flash-thinking-exp-01-21_30K
- o3-mini-30K
- output_plots
- generate_api
- generate_gpu
- instance_analysis
- src
- evaluate
- evaluators
- generate
- models
- type
Some content is hidden
Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.
1,121 files changed
+1565905
-9643258
lines changedBinary file not shown.
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
| 1 | + | |
| 2 | + | |
| 3 | + | |
| 4 | + | |
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
| 1 | + | |
| 2 | + | |
| 3 | + | |
| 4 | + | |
| 5 | + | |
| 6 | + | |
| 7 | + | |
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
1 | 1 | | |
2 | 2 | | |
3 | | - | |
| 3 | + | |
4 | 4 | | |
5 | 5 | | |
6 | 6 | | |
| |||
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
0 commit comments