amphora committed on
Commit
f229c82
·
verified ·
1 Parent(s): ff41f36

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +87 -0
app.py ADDED
@@ -0,0 +1,87 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import streamlit as st
2
+
3
+ st.set_page_config(page_title="HAERAE Open Research Questions", layout="wide")
4
+
5
+ st.title("HAERAE Open Research Questions")
6
+
7
+ st.write("""
8
+ HAERAE is a non-profit research lab focused on the interpretability and evaluation of Korean language models.
9
+ Our mission is to advance the field with insightful benchmarks and tools. Below is an overview of our projects.
10
+
11
+ We've been doing most of our projects internally, but for those that have been unsolvable,
12
+ we are planning to open them to get help from the open-source community.
13
+ """)
14
+
15
+ st.header("HAERAE-Math Challenge")
16
+
17
+ st.write("""
18
+ Today we are introducing our first challenge: HAERAE-Math. We've created high-quality instructions on math
19
+ but don't have an idea on how to generate high-quality answers for them. We are looking for solutions that
20
+ use open-source models with openly available licenses.
21
+
22
+ We have created a total of 20,000 instructions already and are generating more. We've opened up a preview
23
+ of 50 of them in this link: [HAERAE-Math Samples](https://huggingface.co/datasets/HAERAE-HUB/HAERAE-Math-samples)
24
+
25
+ For those who generate answers for the 50 and share the methodology/results with us, we'll share the
26
+ remaining instructions and credit for the resulting dataset.
27
+ """)
28
+
29
+ st.subheader("Example Question")
30
+
31
+ example_question = """
32
+ 한국의 보안 전문가가 고도화된 데이터 보호 시스템을 개발하고 있습니다. 이 시스템은 3차원 기하학적 잠금 메커니즘을 사용하는데, 잠금 장치는 원뿔 모양으로 되어 있고, 밑면의 반지름은 6cm, 높이는 8cm입니다. 이 원뿔 모양의 잠금 장치에는 원통 모양의 열쇠가 딱 맞게 들어가게 설계되어 있습니다.
33
+
34
+ 보안 전문가는 더 높은 수준의 보안을 위해 원통 모양의 열쇠 안에 구 모양의 잠금 장치를 추가하려고 합니다. 이 구는 원통 안에 딱 들어가도록 설계되어 있습니다.
35
+
36
+ λ‹€μŒμ˜ μ§ˆλ¬Έλ“€μ„ ν•΄κ²°ν•˜μ‹œκΈ° λ°”λžλ‹ˆλ‹€:
37
+
38
+ 1. 원뿔 안에 딱 들어가게 설계된 원통의 반지름은 얼마인가요?
39
+ 2. 원통 안에 딱 들어가게 설계된 구의 부피는 얼마인가요?
40
+ 3. 원뿔, 원통, 구가 모두 같은 중심축을 공유하고 있으며 원뿔의 꼭대기점과 원통, 구의 중심점이 동일하다고 가정하면, 원뿔에서 원통이 차지하는 비율을 구하시오.
41
+ 4. 이제 원뿔의 높이를 2배로 늘리자. 원뿔의 높이가 16cm가 되었을 때, 원통과 구의 크기와 부피는 어떻게 변하나요?
42
+ 5. 원뿔의 높이와 밑면의 반지름을 각각 h와 r이라고 할 때, 원통과 구의 최대 부피를 r과 h로 표현하시오.
43
+
44
+ 원뿔, 원통, 구의 부피 공식을 사용하여 문제를 해결하시기 바랍니다:
45
+
46
+ μ›λΏ”μ˜ λΆ€ν”Ό: V = 1/3Ο€rΒ²h
47
+ μ›ν†΅μ˜ λΆ€ν”Ό: V = Ο€rΒ²h
48
+ 구의 부피: V = 4/3πr³
49
+ """
50
+
51
+ st.code(example_question, language="markdown")
52
+
53
+ st.header("How to Participate")
54
+
55
+ st.write("""
56
+ 1. Access the 50 sample questions from the provided Hugging Face dataset link.
57
+ 2. Generate high-quality answers for these questions using open-source models.
58
+ 3. Document your methodology and results.
59
+ 4. Share your findings with us through [contact information or submission form].
60
+ 5. If your approach is promising, we'll provide access to the full dataset of 20,000 instructions.
61
+ 6. Collaborate with us to refine and improve the answer generation process.
62
+ 7. Receive credit as a contributor to the final HAERAE-Math dataset.
63
+ """)
64
+
65
+ st.header("Why Participate?")
66
+
67
+ st.write("""
68
+ - Contribute to advancing Korean language model research
69
+ - Gain access to a large, high-quality dataset of math instructions
70
+ - Collaborate with HAERAE researchers
71
+ - Receive recognition in the field of NLP and math education
72
+ - Potential for co-authorship on related publications
73
+ """)
74
+
75
+ st.header("Contact Us")
76
+
77
+ st.write("""
78
+ For more information or to submit your results, please contact us at:
79
+ [Your contact information or a link to a submission form]
80
+ """)
81
+
82
+ st.sidebar.title("About HAERAE")
83
+ st.sidebar.info("""
84
+ HAERAE is a non-profit research lab dedicated to advancing the field of
85
+ Korean language model interpretability and evaluation. Our work focuses on
86
+ creating insightful benchmarks and tools to push the boundaries of NLP research.
87
+ """)