"""Batch-extract structured problem descriptions from parsed Markdown files.

For every Markdown file matched by ``INPUT_GLOB`` the script reads the text,
sends it to the LLM with ``PROBLEM_EXTRACT_PROMPT``, parses the reply into
JSON and writes it to ``OUTPUT_DIR`` as ``<year>_<problem_type>.json``.
"""
import glob
import os
import sys

from llm.llm import LLM
from utils.utils import read_json_file, write_json_file, write_text_file, json_to_markdown, read_text_file, parse_llm_output_to_json
from agent.create_charts import Chart
# from utils.convert_format import markdown_to_latex
from prompt.template import PROBLEM_EXTRACT_PROMPT

# Defaults match the values the script originally hard-coded.
INPUT_GLOB = '/Users/ann/Downloads/methmatical_paper_extraction/parse/2025_*/content/*.md'
OUTPUT_DIR = '/Users/ann/Documents/projects/math_modeling/data/actor_data/input/problem'
MODEL_NAME = 'chatgpt-4o-latest'


def _problem_name_from_path(path):
    """Return ``'<year>_<problem_type>'`` derived from a Markdown file path.

    The file name (up to its first ``.``) must consist of exactly four
    ``_``-separated fields; the first is used as the year and the last as
    the problem type, the two middle fields are ignored.

    Raises:
        ValueError: if the file name does not have exactly four fields.
    """
    stem = os.path.basename(path).split('.')[0]
    fields = stem.split('_')
    if len(fields) != 4:
        raise ValueError(
            f"expected a file name with 4 '_'-separated fields, got {stem!r}"
        )
    year, _, _, problem_type = fields
    return f'{year}_{problem_type}'


def main(input_glob=INPUT_GLOB, output_dir=OUTPUT_DIR, model_name=MODEL_NAME):
    """Extract one problem JSON per Markdown file matched by *input_glob*.

    Args:
        input_glob: glob pattern selecting the Markdown files to process.
        output_dir: directory the ``<problem_name>.json`` files are written to.
        model_name: model identifier passed to ``LLM``.

    Files whose names cannot be parsed are reported on stderr and skipped so
    that one stray file does not abort the whole batch.
    """
    llm = LLM(model_name)
    # glob order is filesystem-dependent; sort for reproducible runs.
    for file in sorted(glob.glob(input_glob)):
        try:
            problem_name = _problem_name_from_path(file)
        except ValueError as err:
            print(f'Skipping {file}: {err}', file=sys.stderr)
            continue

        problem_str = read_text_file(file)
        # The raw text is passed both inside the prompt and as the second
        # positional argument, exactly as the original call did.
        problem = llm.generate(PROBLEM_EXTRACT_PROMPT.format(question=problem_str), problem_str)
        problem = parse_llm_output_to_json(problem)
        print(problem)
        write_json_file(os.path.join(output_dir, f'{problem_name}.json'), problem)


if __name__ == "__main__":
    main()