Spaces:
Sleeping
Sleeping
| import math | |
| import matplotlib.pyplot as plt | |
| GREEN = "\033[92m" | |
| YELLOW = "\033[93m" | |
| RED = "\033[91m" | |
| RESET = "\033[0m" | |
| COLOR_MAP = {"red":RED, "orange": YELLOW, "green": GREEN} | |
| class Tester: | |
| def __init__(self, predictor, data, title=None, size=250): | |
| self.predictor = predictor | |
| self.data = data | |
| self.title = title or predictor.__name__.replace("_", " ").title() | |
| self.size = size | |
| self.guesses = [] | |
| self.truths = [] | |
| self.errors = [] | |
| self.sles = [] | |
| self.colors = [] | |
| def color_for(self, error, truth): | |
| if error<40 or error/truth < 0.2: | |
| return "green" | |
| elif error<80 or error/truth < 0.4: | |
| return "orange" | |
| else: | |
| return "red" | |
| def run_datapoint(self, i): | |
| datapoint = self.data[i] | |
| guess = self.predictor(datapoint) | |
| truth = datapoint.price | |
| error = abs(guess - truth) | |
| log_error = math.log(truth+1) - math.log(guess+1) | |
| sle = log_error ** 2 | |
| color = self.color_for(error, truth) | |
| title = datapoint.title if len(datapoint.title) <= 40 else datapoint.title[:40]+"..." | |
| self.guesses.append(guess) | |
| self.truths.append(truth) | |
| self.errors.append(error) | |
| self.sles.append(sle) | |
| self.colors.append(color) | |
| print(f"{COLOR_MAP[color]}{i+1}: Guess: ${guess:,.2f} Truth: ${truth:,.2f} Error: ${error:,.2f} SLE: {sle:,.2f} Item: {title}{RESET}") | |
| def chart(self, title): | |
| max_error = max(self.errors) | |
| plt.figure(figsize=(12, 8)) | |
| max_val = max(max(self.truths), max(self.guesses)) | |
| plt.plot([0, max_val], [0, max_val], color='deepskyblue', lw=2, alpha=0.6) | |
| plt.scatter(self.truths, self.guesses, s=3, c=self.colors) | |
| plt.xlabel('Ground Truth') | |
| plt.ylabel('Model Estimate') | |
| plt.xlim(0, max_val) | |
| plt.ylim(0, max_val) | |
| plt.title(title) | |
| plt.show() | |
| def report(self): | |
| average_error = sum(self.errors) / self.size | |
| rmsle = math.sqrt(sum(self.sles) / self.size) | |
| hits = sum(1 for color in self.colors if color=="green") | |
| title = f"{self.title} Error=${average_error:,.2f} RMSLE={rmsle:,.2f} Hits={hits/self.size*100:.1f}%" | |
| self.chart(title) | |
| def run(self): | |
| self.error = 0 | |
| for i in range(self.size): | |
| self.run_datapoint(i) | |
| self.report() | |
| def test(cls, function, data): | |
| cls(function, data).run() |