import asyncio
import ast

import httpx
from openai import AsyncOpenAI


def create_llm_client(config):
    """Create and return an AsyncOpenAI client with the given configuration."""
    return AsyncOpenAI(
        base_url=config['api']['openai_url'],
        api_key=config['api']['openai_api'],
        http_client=httpx.AsyncClient(verify=config['api'].get('ssl_verify', True))
    )
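
# A sketch of the config shape these functions expect (an assumption inferred
# from the keys accessed in this module; align it with the real config file):
#
#     config = {
#         'api': {
#             'openai_url': ...,    # base URL of the OpenAI-compatible endpoint
#             'openai_api': ...,    # API key
#             'openai_model': ...,  # model name used for both prompts
#             'ssl_verify': True,   # optional; defaults to True
#             'max_attempts': 3,    # optional retry count; defaults to 3
#         },
#         'search': {
#             'researcher_interests': ...,  # optional free-text interests
#         },
#     }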


async def process_papers_with_llm(papers_with_abstracts, query, client, config):
    """
    Process papers using LLM for summarization and interest rating concurrently.

    Args:
        papers_with_abstracts (dict): Dictionary of paper titles and abstracts
        query (str): Search query for relevance rating
        client: AsyncOpenAI client instance
        config (dict): Configuration dictionary

    Returns:
        dict: Processed results with summaries and interest ratings
    """
    system_prompt_summarizer = {
        "role": "system",
        "content": """
You are a scientific abstract summarizer.
Your task is to extract key points from research paper abstracts and format them as a Python list of strings.
Each bullet point should be concise, informative, and capture essential information.
Always output exactly in this format: ['point 1', 'point 2', 'point 3'] with no additional text or explanations."""}

    system_prompt_interest = {
        "role": "system",
        "content": """
You are a research relevance evaluator. Your task is to assess how well a research paper abstract matches a given query or research interest. Rate the relevance on a scale of 0-10 where:
- 0: Completely unrelated
- 1-3: Minimally related (tangential connection)
- 4-6: Moderately related (some overlap in topics/methods)
- 7-9: Highly related (direct relevance to query)
- 10: Perfectly aligned with the query
Output only a single integer between 0 and 10 with no additional text or explanation."""}
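
    # The two prompts above pin the raw model output to machine-parseable forms:
    # the summarizer must return a Python list literal such as
    # "['point 1', 'point 2', 'point 3']" (parsed below with ast.literal_eval),
    # and the rater a bare integer 0-10 (parsed with int()).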

    async def process_single_paper(title, paper_data):
        """Process a single paper with LLM summarization and interest rating."""
        abstract = paper_data["abstract"]
        url = paper_data["url"]
        journal = paper_data.get("journal")  # Preserve journal if present

        # Summarization with retry logic
        max_attempts = config['api'].get('max_attempts', 3)
        summary_result = None
        for attempt in range(max_attempts):
            try:
                response = await client.chat.completions.create(
                    model=config['api']['openai_model'],
                    messages=[
                        system_prompt_summarizer,
                        {"role": "user", "content": "Summarize the following abstract into 3-5 key bullet points. "
                                                    "Output only the Python list format:\n"
                                                    f"Title: {title}\n"
                                                    f"Abstract: {abstract}\n"},
                    ]
                )
                output = response.choices[0].message.content
                # The system prompt requests a Python list literal, so parse it safely
                summary_result = ast.literal_eval(output)
                break  # Success, exit retry loop
            except (ValueError, SyntaxError) as e:
                print(f"Summary attempt {attempt + 1}/{max_attempts} failed for '{title[:50]}...': {e}")
                if attempt == max_attempts - 1:
                    return title, f"Failed to parse output after {max_attempts} attempts, skipping paper: {title}"
            except Exception as e:
                print(f"Unexpected error on summary attempt {attempt + 1}/{max_attempts} for '{title[:50]}...': {e}")
                if attempt == max_attempts - 1:
                    return title, f"Failed after {max_attempts} attempts due to unexpected error, skipping paper: {title}"

        if summary_result is None:
            return title, f"Failed to get summary after {max_attempts} attempts"

        # Interest rating with retry logic (supports optional researcher interests from config)
        rating_attempts = 3
        interest_rating = None
        researcher_interests = config.get('search', {}).get('researcher_interests')

        # Build the user prompt: prefer researcher_interests if provided; include both if query also provided
        if researcher_interests:
            # Include both researcher interests and the query (if present) to give the model full context.
            user_prompt_header = f"Researcher interests: {researcher_interests}\n\nQuery: {query}\n\n"
            user_instructions = "Please rate the relevance of the following abstract to the researcher's interests and the query."
        else:
            user_prompt_header = f"Query: {query}\n\n"
            user_instructions = "Rate the relevance of this abstract to the query."

        for rating_attempt in range(rating_attempts):
            try:
                interest_response = await client.chat.completions.create(
                    model=config['api']['openai_model'],
                    messages=[
                        system_prompt_interest,
                        {"role": "user", "content": user_prompt_header + f"Abstract: {abstract}\n\n{user_instructions}"},
                    ]
                )
                interest_output = interest_response.choices[0].message.content.strip()
                interest_rating = int(interest_output)
                # Validate the rating is in the expected range
                if 0 <= interest_rating <= 10:
                    break  # Success, exit retry loop
                else:
                    raise ValueError(f"Rating {interest_rating} is outside valid range 0-10")
            except (ValueError, TypeError) as e:
                print(f"Interest rating attempt {rating_attempt + 1}/{rating_attempts} failed for '{title[:50]}...': {e}")
                if rating_attempt == rating_attempts - 1:
                    interest_rating = f"Failed to get rating after {rating_attempts} attempts"
            except Exception as e:
                print(f"Unexpected error on interest rating attempt {rating_attempt + 1}/{rating_attempts} for '{title[:50]}...': {e}")
                if rating_attempt == rating_attempts - 1:
                    interest_rating = "Failed to get rating due to unexpected error"

        # Return structured result
        result = {
            'summary': summary_result,
            'interest_rating': interest_rating,
            'url': url,
            'journal': journal,
        }
        if isinstance(interest_rating, int):
            print(f"Successfully processed with rating {interest_rating}: {title[:50]}...")
        else:
            print(f"Summary processed but rating failed: {title[:50]}...")
        return title, result

    # Process all papers concurrently using asyncio.gather()
    tasks = []
    for title, paper_data in papers_with_abstracts.items():
        tasks.append(process_single_paper(title, paper_data))

    # Execute all tasks concurrently; return_exceptions=True keeps a single
    # failed paper from cancelling the rest of the batch
    results = await asyncio.gather(*tasks, return_exceptions=True)

    # Build results dictionary
    res = {}
    for result in results:
        if isinstance(result, Exception):
            print(f"Task failed with exception: {result}")
            continue
        title, paper_result = result
        res[title] = paper_result
    return res
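
# Usage sketch (illustrative, not part of the original module): wires the client
# factory and the processing coroutine together. Every value below is a
# placeholder assumption, not a real endpoint, key, model, or paper.
if __name__ == "__main__":
    demo_config = {
        'api': {
            'openai_url': 'https://api.example.com/v1',  # placeholder endpoint
            'openai_api': 'sk-placeholder',              # placeholder key
            'openai_model': 'example-model',             # placeholder model name
            'ssl_verify': True,
            'max_attempts': 3,
        },
        'search': {'researcher_interests': 'protein folding'},
    }
    demo_papers = {
        'Example Paper Title': {
            'abstract': 'An example abstract about protein structure.',
            'url': 'https://example.org/paper',
            'journal': 'Example Journal',
        },
    }
    demo_client = create_llm_client(demo_config)
    demo_results = asyncio.run(
        process_papers_with_llm(demo_papers, 'protein structure prediction',
                                demo_client, demo_config)
    )
    print(demo_results)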