Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -2,16 +2,18 @@ import streamlit as st
|
|
2 |
|
3 |
st.set_page_config(page_title="HAERAE Open Research Questions", layout="wide")
|
4 |
|
5 |
-
#
|
|
|
|
|
|
|
6 |
lang = st.radio("Language / 언어", ["English", "한국어"])
|
7 |
|
8 |
# Content in both languages
|
9 |
content = {
|
10 |
"English": {
|
11 |
-
"title": "HAERAE Open Research Questions",
|
12 |
"intro": """
|
13 |
HAERAE is a non-profit research lab focused on the interpretability and evaluation of Korean language models.
|
14 |
-
Our mission is to advance the field with insightful benchmarks and tools.
|
15 |
|
16 |
We've been doing most of our projects internally, but for those that have been unsolvable,
|
17 |
we are planning to open them to get help from the open-source community.
|
@@ -36,15 +38,12 @@ content = {
|
|
36 |
3. Document your methodology and results.
|
37 |
4. Share your findings with us through [contact information or submission form].
|
38 |
5. If your approach is promising, we'll provide access to the full dataset of 20,000 instructions.
|
39 |
-
6. Collaborate with us to refine and improve the answer generation process.
|
40 |
-
7. Receive credit as a contributor to the final HAERAE-Math dataset.
|
41 |
""",
|
42 |
"why_title": "Why Participate?",
|
43 |
"why": """
|
44 |
- Contribute to advancing Korean language model research
|
45 |
- Gain access to a large, high-quality dataset of math instructions
|
46 |
- Collaborate with HAERAE researchers
|
47 |
-
- Receive recognition in the field of NLP and math education
|
48 |
- Potential for co-authorship on related publications
|
49 |
""",
|
50 |
"contact_title": "Contact Us",
|
@@ -60,43 +59,40 @@ content = {
|
|
60 |
"""
|
61 |
},
|
62 |
"한국어": {
|
63 |
-
"title": "HAERAE 공개 연구 질문",
|
64 |
"intro": """
|
65 |
-
HAERAE๋ ํ๊ตญ์ด ์ธ์ด ๋ชจ๋ธ์
|
66 |
-
|
67 |
|
68 |
-
대부분의 프로젝트를 내부적으로 수행해 왔지만, 해결하기 어려운 문제들에 대해서는
|
69 |
-
오픈 소스 커뮤니티의 도움을 받고자
|
70 |
""",
|
71 |
-
"challenge_title": "HAERAE-Math
|
72 |
"challenge_desc": """
|
73 |
-
|
74 |
-
|
75 |
-
|
76 |
|
77 |
-
|
78 |
-
다음 링크에서
|
|
|
79 |
|
80 |
-
50개에 대한 답변을 생성하고 방법론/결과를
|
81 |
-
|
82 |
""",
|
83 |
"example_title": "์์ ์ง๋ฌธ",
|
84 |
"how_to_title": "참여 방법",
|
85 |
"how_to": """
|
86 |
-
1. 제공된 Hugging Face 데이터셋 링크에서 50개의 샘플
|
87 |
2. 오픈 소스 모델을 사용하여 이 질문들에 대한 고품질 답변을 생성합니다.
|
88 |
3. 방법론과 결과를 문서화합니다.
|
89 |
-
4. [연락처 정보 또는 제출 양식]을 통해 귀하의 결과를
|
90 |
-
5. 귀하의 접근 방식이
|
91 |
-
6. 답변 생성 과정을 개선하고 발전시키기 위해 우리와 협력합니다.
|
92 |
-
7. 최종 HAERAE-Math 데이터셋의 기여자로 인정받습니다.
|
93 |
""",
|
94 |
"why_title": "왜 참여해야 하나요?",
|
95 |
"why": """
|
96 |
- 한국어 언어 모델 연구 발전에 기여
|
97 |
- 대규모의 고품질 수학 지시문 데이터셋에 접근
|
98 |
- HAERAE ์ฐ๊ตฌ์๋ค๊ณผ ํ๋ ฅ
|
99 |
-
- NLP 및 수학 교육 분야에서 인정받을 기회
|
100 |
- 관련 출판물의 공동 저자가 될 가능성
|
101 |
""",
|
102 |
"contact_title": "연락처",
|
@@ -106,15 +102,13 @@ content = {
|
|
106 |
""",
|
107 |
"sidebar_title": "HAERAE 소개",
|
108 |
"sidebar_content": """
|
109 |
-
HAERAE๋ ํ๊ตญ์ด ์ธ์ด ๋ชจ๋ธ์
|
110 |
-
|
111 |
"""
|
112 |
}
|
113 |
}
|
114 |
|
115 |
# Main content
|
116 |
-
st.title(content[lang]["title"])
|
117 |
-
|
118 |
st.write(content[lang]["intro"])
|
119 |
|
120 |
st.header(content[lang]["challenge_title"])
|
|
|
2 |
|
3 |
st.set_page_config(page_title="HAERAE Open Research Questions", layout="wide")
|
4 |
|
5 |
+
# Title (always in English)
|
6 |
+
st.title("HAERAE Open Research Questions")
|
7 |
+
|
8 |
+
# Language selection below the title
|
9 |
lang = st.radio("Language / 언어", ["English", "한국어"])
|
10 |
|
11 |
# Content in both languages
|
12 |
content = {
|
13 |
"English": {
|
|
|
14 |
"intro": """
|
15 |
HAERAE is a non-profit research lab focused on the interpretability and evaluation of Korean language models.
|
16 |
+
Our mission is to advance the field with insightful benchmarks and tools.
|
17 |
|
18 |
We've been doing most of our projects internally, but for those that have been unsolvable,
|
19 |
we are planning to open them to get help from the open-source community.
|
|
|
38 |
3. Document your methodology and results.
|
39 |
4. Share your findings with us through [contact information or submission form].
|
40 |
5. If your approach is promising, we'll provide access to the full dataset of 20,000 instructions.
|
|
|
|
|
41 |
""",
|
42 |
"why_title": "Why Participate?",
|
43 |
"why": """
|
44 |
- Contribute to advancing Korean language model research
|
45 |
- Gain access to a large, high-quality dataset of math instructions
|
46 |
- Collaborate with HAERAE researchers
|
|
|
47 |
- Potential for co-authorship on related publications
|
48 |
""",
|
49 |
"contact_title": "Contact Us",
|
|
|
59 |
"""
|
60 |
},
|
61 |
"한국어": {
|
|
|
62 |
"intro": """
|
63 |
+
HAERAE๋ ํ๊ตญ์ด ์ธ์ด ๋ชจ๋ธ์ ํด์๊ณผ ํ๊ฐ์ ์ฐ๊ตฌ๋ฅผ ์ํด ์ค๋ฆฝ๋ ๋น์๋ฆฌ ์ฐ๊ตฌํ์
๋๋ค.
|
64 |
+
저희는 다양한 벤치마크와 연구를 통해 한국어 자연어 처리 연구를 발전시키기 위해 노력하고 있습니다.
|
65 |
|
66 |
+
기존에는 대부분의 프로젝트를 내부적으로 수행해 왔지만, 내부적으로 해결하기 어려운 문제들에 대해서는
|
67 |
+
오픈 소스 커뮤니티의 도움을 받고자 Open-Research-Question 프로그램을 운영하게 되었습니다.
|
68 |
""",
|
69 |
+
"challenge_title": "HAERAE-Math Challenge",
|
70 |
"challenge_desc": """
|
71 |
+
저희 팀은 [QARV-Instruct](https://huggingface.co/datasets/HAERAE-HUB/qarv-instruct-ko) 부터 시작해서 고품질의 한국어 지시문 데이터를
|
72 |
+
만들기 위해 노력 중에 있습니다. 이 과정에서 매우 높은 수준의 수학 지시문을 제작하였으나, 해당 지시문에 대해 적절한 답변을 만들지 못하고 있습니다.
|
73 |
+
์ ํฌ๋ ์ด๋ฒ ์ฑ๋ฆฐ์ง๋ฅผ ํตํด ์คํ์์ค LLM์ ์ฌ์ฉํ์ฌ ํด๋น ๋ฌธ์ ๋ค์ ๋ํ ๋ต์ ์ ์ํ ์ ์๋ ์๋ฃจ์
์ ์ฐพ๊ณ ์์ต๋๋ค.
|
74 |
|
75 |
+
현재는 총 20,000개의 지시문을 이미 만들었으며 추가적으로 생성하는 과정 중에 있습니다.
|
76 |
+
생성된 지시문 중 랜덤으로 샘플링된 50개의 질문은 다음 링크에서 보실 수 있습니다.
|
77 |
+
[HAERAE-Math 샘플](https://huggingface.co/datasets/HAERAE-HUB/HAERAE-Math-samples)
|
78 |
|
79 |
+
50개에 대한 답변을 생성하고 방법론/결과를 저희에게 공유해주시는 분들께 저희가 생성한 전체 지시문과 최종 데이터셋에 대한 기여도를 인정해드릴 예정입니다.
|
80 |
+
(결과에 따라 논문화도 고민 중에 있습니다.)
|
81 |
""",
|
82 |
"example_title": "์์ ์ง๋ฌธ",
|
83 |
"how_to_title": "참여 방법",
|
84 |
"how_to": """
|
85 |
+
1. 제공된 Hugging Face 데이터셋 링크에서 50개의 샘플 질문을 확인합니다.
|
86 |
2. 오픈 소스 모델을 사용하여 이 질문들에 대한 고품질 답변을 생성합니다.
|
87 |
3. 방법론과 결과를 문서화합니다.
|
88 |
+
4. [연락처 정보 또는 제출 양식]을 통해 귀하의 결과를 저희와 공유합니다.
|
89 |
+
5. 귀하의 접근 방식이 유의미 하다고 판단 된다면, 나머지 지시문 데이터셋에 대한 접근 권한을 제공해 드립니다.
|
|
|
|
|
90 |
""",
|
91 |
"why_title": "왜 참여해야 하나요?",
|
92 |
"why": """
|
93 |
- 한국어 언어 모델 연구 발전에 기여
|
94 |
- 대규모의 고품질 수학 지시문 데이터셋에 접근
|
95 |
- HAERAE ์ฐ๊ตฌ์๋ค๊ณผ ํ๋ ฅ
|
|
|
96 |
- 관련 출판물의 공동 저자가 될 가능성
|
97 |
""",
|
98 |
"contact_title": "연락처",
|
|
|
102 |
""",
|
103 |
"sidebar_title": "HAERAE 소개",
|
104 |
"sidebar_content": """
|
105 |
+
HAERAE๋ ํ๊ตญ์ด ์ธ์ด ๋ชจ๋ธ์ ํด์๊ณผ ํ๊ฐ์ ์ฐ๊ตฌ๋ฅผ ์ํด ์ค๋ฆฝ๋ ๋น์๋ฆฌ ์ฐ๊ตฌํ์
๋๋ค.
|
106 |
+
저희는 다양한 벤치마크와 연구를 통해 한국어 자연어 처리 연구를 발전시키기 위해 노력하고 있습니다.
|
107 |
"""
|
108 |
}
|
109 |
}
|
110 |
|
111 |
# Main content
|
|
|
|
|
112 |
st.write(content[lang]["intro"])
|
113 |
|
114 |
st.header(content[lang]["challenge_title"])
|