File size: 1,045 Bytes
8496edd
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
from llm.llm import LLM
from utils.utils import read_json_file, write_json_file, write_text_file, json_to_markdown, read_text_file, parse_llm_output_to_json
from agent.create_charts import Chart
# from utils.convert_format import markdown_to_latex
import os
from prompt.template import PROBLEM_EXTRACT_PROMPT



# Glob pattern selecting the 2025 problem-statement markdown files to process.
PROBLEM_GLOB = '/Users/ann/Downloads/methmatical_paper_extraction/parse/2025_*/content/*.md'
# Directory that receives one `<year>_<problem_type>.json` file per input file.
OUTPUT_DIR = '/Users/ann/Documents/projects/math_modeling/data/actor_data/input/problem'
# Model identifier handed to the project's LLM wrapper.
MODEL_NAME = 'chatgpt-4o-latest'


def problem_name_from_path(path):
    """Derive the ``<year>_<problem_type>`` name from a problem file path.

    The file name (text before its first ``.``) must consist of exactly four
    underscore-separated fields; the first is used as the year and the last
    as the problem type, the two middle fields are ignored.

    Args:
        path: Path to a problem file, e.g. ``.../2025_MCM_Problem_A.md``.

    Returns:
        The output name, e.g. ``'2025_A'``.

    Raises:
        ValueError: If the file name does not have exactly four
            underscore-separated fields.
    """
    # Everything before the first dot, so multi-dot names behave as before.
    stem = os.path.basename(path).split('.')[0]
    fields = stem.split('_')
    if len(fields) != 4:
        raise ValueError(
            f'Unexpected problem file name {path!r}: expected 4 '
            f'underscore-separated fields, got {len(fields)}'
        )
    year, _, _, problem_type = fields
    return f'{year}_{problem_type}'


def main():
    """Extract a structured problem from each matching file and save it as JSON.

    For every file matching ``PROBLEM_GLOB`` the text is read, sent to the LLM
    through ``PROBLEM_EXTRACT_PROMPT``, the reply is parsed with
    ``parse_llm_output_to_json``, printed, and written to ``OUTPUT_DIR``.
    """
    import glob

    llm = LLM(MODEL_NAME)
    # glob returns matches in arbitrary order; sort for reproducible runs.
    for file in sorted(glob.glob(PROBLEM_GLOB)):
        # Resolve the output name first so a malformed file name fails
        # before an LLM call is spent on it.
        problem_name = problem_name_from_path(file)
        problem_str = read_text_file(file)
        # NOTE(review): the raw text is passed both inside the prompt and as
        # the second argument of generate() -- confirm that is intended.
        prompt = PROBLEM_EXTRACT_PROMPT.format(question=problem_str)
        problem = parse_llm_output_to_json(llm.generate(prompt, problem_str))
        print(problem)
        write_json_file(f'{OUTPUT_DIR}/{problem_name}.json', problem)


if __name__ == "__main__":
    main()