File size: 954 Bytes
8e59f09
 
 
382e2e7
8e59f09
 
 
382e2e7
8e59f09
 
 
 
382e2e7
e8bf2aa
 
8e59f09
 
e8bf2aa
8e59f09
e8bf2aa
8e59f09
e8bf2aa
8e59f09
e8bf2aa
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
import json
import re

def process_json_files(start: int, end: int) -> list:
    """Load the numbered JSON files ``texts/NN.json`` for ``start``..``end``.

    File names are built from the index zero-padded to two digits
    (``texts/01.json``, ``texts/02.json``, ...), relative to the current
    working directory. Both bounds are inclusive; an empty list is returned
    when ``start > end``.

    Args:
        start: First file index to read (inclusive).
        end: Last file index to read (inclusive).

    Returns:
        A list of ``(index, payload)`` tuples in ascending index order.
        On success ``payload`` is ``{"title": ..., "text": ...}``, with
        ``"No title"`` / ``[]`` substituted for missing keys. On failure
        ``payload`` is ``{"error": <message>}``. Files whose parsed content
        is falsy (for example ``{}``, ``[]`` or ``null``) contribute no
        entry at all.
    """
    base_path = "texts"
    results = []

    for i in range(start, end + 1):
        file_name = f"{base_path}/{i:02}.json"

        # Only the I/O and parsing step is guarded, so unrelated errors are
        # never misreported as file problems.
        try:
            with open(file_name, 'r', encoding='utf-8') as file:
                data = json.load(file)
        except FileNotFoundError:
            results.append((i, {"error": f"File {file_name} not found."}))
            continue
        except (json.JSONDecodeError, UnicodeDecodeError) as e:
            # Invalid UTF-8 raises UnicodeDecodeError rather than
            # JSONDecodeError; both mean the file is not readable as JSON.
            results.append((i, {"error": f"File {file_name} could not be read as JSON: {e}"}))
            continue

        if not data:
            # Empty payloads are skipped without an entry.
            continue

        if not isinstance(data, dict):
            # A top-level list/string/number has no .get(); record the
            # problem for this file instead of aborting the whole batch.
            results.append((i, {"error": f"File {file_name} does not contain a JSON object."}))
            continue

        results.append((i, {"title": data.get("title", "No title"), "text": data.get("text", [])}))

    return results