Spaces:

mamogasr
/

llm_engineering

Sleeping

App Files Files Community

llm_engineering / week8 /agents /scanner_agent.py

mamogasr

Upload folder using huggingface_hub

5fdb69e verified 7 months ago

raw

history blame contribute delete

4.7 kB

	import os
	import json
	from typing import Optional, List
	from openai import OpenAI
	from agents.deals import ScrapedDeal, DealSelection
	from agents.agent import Agent


	class ScannerAgent(Agent):
	    """
	    Agent that fetches scraped deals and asks an OpenAI model to select the
	    ones with the most detailed description and a clear price.
	    """

	    MODEL = "gpt-4o-mini"

	    # NOTE: the prompt texts below are sent to the model verbatim; they are runtime data, not comments.
	    SYSTEM_PROMPT = """You identify and summarize the 5 most detailed deals from a list, by selecting deals that have the most detailed, high quality description and the most clear price.
	Respond strictly in JSON with no explanation, using this format. You should provide the price as a number derived from the description. If the price of a deal isn't clear, do not include that deal in your response.
	Most important is that you respond with the 5 deals that have the most detailed product description with price. It's not important to mention the terms of the deal; most important is a thorough description of the product.
	Be careful with products that are described as "$XXX off" or "reduced by $XXX" - this isn't the actual price of the product. Only respond with products when you are highly confident about the price.

	{"deals": [
	{
	"product_description": "Your clearly expressed summary of the product in 4-5 sentences. Details of the item are much more important than why it's a good deal. Avoid mentioning discounts and coupons; focus on the item itself. There should be a paragpraph of text for each item you choose.",
	"price": 99.99,
	"url": "the url as provided"
	},
	...
	]}"""

	    USER_PROMPT_PREFIX = """Respond with the most promising 5 deals from this list, selecting those which have the most detailed, high quality product description and a clear price that is greater than 0.
	Respond strictly in JSON, and only JSON. You should rephrase the description to be a summary of the product itself, not the terms of the deal.
	Remember to respond with a paragraph of text in the product_description field for each of the 5 items that you select.
	Be careful with products that are described as "$XXX off" or "reduced by $XXX" - this isn't the actual price of the product. Only respond with products when you are highly confident about the price.

	Deals:

	"""

	    USER_PROMPT_SUFFIX = "\n\nStrictly respond in JSON and include exactly 5 deals, no more."

	    name = "Scanner Agent"
	    color = Agent.CYAN

	    def __init__(self):
	        """
	        Set up this instance by initializing OpenAI
	        """
	        self.log("Scanner Agent is initializing")
	        self.openai = OpenAI()
	        self.log("Scanner Agent is ready")

	    def fetch_deals(self, memory) -> List[ScrapedDeal]:
	        """
	        Look up deals published on RSS feeds
	        Return any new deals that are not already in the memory provided
	        :param memory: an iterable of previously raised items; each item must expose `.deal.url`
	        :return: the scraped deals whose url does not appear in memory
	        """
	        self.log("Scanner Agent is about to fetch deals from RSS feed")
	        # A set keeps the "already seen" check O(1) per scraped deal instead of scanning a list
	        known_urls = {opp.deal.url for opp in memory}
	        scraped = ScrapedDeal.fetch()
	        result = [scrape for scrape in scraped if scrape.url not in known_urls]
	        self.log(f"Scanner Agent received {len(result)} deals not already scraped")
	        return result

	    def make_user_prompt(self, scraped) -> str:
	        """
	        Create a user prompt for OpenAI based on the scraped deals provided
	        :param scraped: the scraped deals; each must provide a describe() method
	        :return: prefix + deal descriptions separated by blank lines + suffix
	        """
	        descriptions = '\n\n'.join(scrape.describe() for scrape in scraped)
	        return self.USER_PROMPT_PREFIX + descriptions + self.USER_PROMPT_SUFFIX

	    def scan(self, memory: Optional[List] = None) -> Optional[DealSelection]:
	        """
	        Call OpenAI to provide a high potential list of deals with good descriptions and prices
	        Use StructuredOutputs to ensure it conforms to our specifications
	        :param memory: previously raised items (each exposing `.deal.url`, as read by fetch_deals);
	            omitted or None means nothing has been raised yet
	        :return: a selection of deals with price > 0, or None if there are no new scraped deals
	            or the model returned no parsed selection
	        """
	        # Avoid a shared mutable default: build a fresh empty list per call
	        if memory is None:
	            memory = []
	        scraped = self.fetch_deals(memory)
	        if not scraped:
	            return None
	        user_prompt = self.make_user_prompt(scraped)
	        self.log("Scanner Agent is calling OpenAI using Structured Output")
	        completion = self.openai.beta.chat.completions.parse(
	            model=self.MODEL,
	            messages=[
	                {"role": "system", "content": self.SYSTEM_PROMPT},
	                {"role": "user", "content": user_prompt},
	            ],
	            response_format=DealSelection,
	        )
	        selection = completion.choices[0].message.parsed
	        # `parsed` can be None (e.g. when the model refuses); report "no deals" instead of crashing
	        if selection is None:
	            self.log("Scanner Agent received no parsed deal selection from OpenAI")
	            return None
	        # Drop entries where the model could not determine a positive price
	        selection.deals = [deal for deal in selection.deals if deal.price > 0]
	        self.log(f"Scanner Agent received {len(selection.deals)} selected deals with price>0 from OpenAI")
	        return selection