File size: 2,335 Bytes
1852be7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
a84d3eb
1852be7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
357d882
 
a84d3eb
0b76458
357d882
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
import json
import os
import base64
import streamlit as st

FIELDS = [
    "CodeValue",
    "CodeType",
    "Context",
    "Question",
    "AnswerText",
    "UpVoteCount",
    "DownVoteCount",
    "VoteComment",
]

IO_PATTERN = "*.jsonl"


def read_jsonl_file(file_path):
    if not os.path.exists(file_path):
        return []
    with open(file_path, "r") as f:
        lines = f.readlines()
    records = [json.loads(line) for line in lines]
    return records


def write_jsonl_file(file_path, records):
    with open(file_path, "w") as f:
        for record in records:
            f.write(json.dumps(record) + "\n")


def list_files():
    return [f for f in os.listdir() if f.endswith(".jsonl")]


def download_link(file_path):
    with open(file_path, "rb") as f:
        contents = f.read()
    b64 = base64.b64encode(contents).decode()
    href = f'<a href="data:application/octet-stream;base64,{b64}" download="{file_path}">Download</a>'
    return href


def main():
    jsonl_files = list_files()

    if not jsonl_files:
        st.warning("No JSONL files found. Creating new file.")
        jsonl_files.append("data.jsonl")
        write_jsonl_file("data.jsonl", [])

    selected_file = st.sidebar.text_input("Enter file name", value=jsonl_files[0])
    if selected_file != jsonl_files[0]:
        os.rename(jsonl_files[0], selected_file)
        jsonl_files[0] = selected_file

    st.sidebar.write("JSONL files:")
    selected_file_index = st.sidebar.selectbox("", range(len(jsonl_files)))
    for i, file_name in enumerate(jsonl_files):
        if i == selected_file_index:
            selected_file = file_name
            st.sidebar.write(f"> {file_name}")
        else:
            st.sidebar.write(file_name)

    st.sidebar.markdown(download_link(selected_file), unsafe_allow_html=True)

    records = read_jsonl_file(selected_file)

    for field in FIELDS:
        value = st.text_input(field, key=field)
        st.write(f"{field}: {value}")

    if st.button("Add Record"):
        record = {field: st.session_state[field] for field in FIELDS}
        records.append(record)
        write_jsonl_file(selected_file, records)
        st.success("Record added!")

    st.write(f"Current contents of {selected_file}:")
    for record in records:
        st.write(record)


if __name__ == "__main__":
    main()