|
|
from llm.llm import LLM |
|
|
from utils.utils import read_json_file, write_json_file, write_text_file, json_to_markdown, read_text_file, parse_llm_output_to_json |
|
|
from agent.create_charts import Chart |
|
|
|
|
|
import os |
|
|
from prompt.template import PROBLEM_EXTRACT_PROMPT |
|
|
|
|
|
|
|
|
|
|
|
def problem_name_from_path(path: str) -> str:
    """Derive the ``<year>_<problem_type>`` output name from a problem file path.

    The file's base name (text before the first ``.``) must consist of exactly
    four ``_``-separated fields; the first is used as the year and the last as
    the problem type. The two middle fields are ignored.

    Args:
        path: Path to a problem markdown file.

    Returns:
        The string ``f'{year}_{problem_type}'``.

    Raises:
        ValueError: If the base name does not have exactly four fields.
    """
    # os.path.basename instead of split('/') so the separator is not hard-coded.
    stem = os.path.basename(path).split('.')[0]
    fields = stem.split('_')
    if len(fields) != 4:
        raise ValueError(
            f"unexpected problem file name {path!r}: expected 4 "
            f"'_'-separated fields, got {len(fields)}"
        )
    year, _, _, problem_type = fields
    return f'{year}_{problem_type}'


if __name__ == "__main__":
    # Batch job: read each parsed problem markdown file, ask the LLM to extract
    # the problem as structured data, and write one JSON file per problem.
    import glob

    input_pattern = '/Users/ann/Downloads/methmatical_paper_extraction/parse/2025_*/content/*.md'
    output_dir = '/Users/ann/Documents/projects/math_modeling/data/actor_data/input/problem'

    # glob returns files in arbitrary order; sort so runs are reproducible.
    files = sorted(glob.glob(input_pattern))

    # Fail on a missing output directory before any LLM call is made.
    os.makedirs(output_dir, exist_ok=True)

    llm = LLM('chatgpt-4o-latest')

    for file in files:
        problem_name = problem_name_from_path(file)
        problem_str = read_text_file(file)

        # NOTE(review): the raw problem text is passed both inside the formatted
        # prompt and as the second positional argument; the meaning of that
        # second argument is defined by LLM.generate, which is not visible here.
        problem = llm.generate(PROBLEM_EXTRACT_PROMPT.format(question=problem_str), problem_str)
        problem = parse_llm_output_to_json(problem)

        print(problem)
        write_json_file(os.path.join(output_dir, f'{problem_name}.json'), problem)
|
|
|