Update app.py
Browse files
app.py
CHANGED
|
@@ -6,7 +6,9 @@ import logging
|
|
| 6 |
from typing import Tuple, Literal
|
| 7 |
import functools
|
| 8 |
import spaces
|
| 9 |
-
from
|
|
|
|
|
|
|
| 10 |
# Set up logging
|
| 11 |
logging.basicConfig(level=logging.INFO)
|
| 12 |
logger = logging.getLogger(__name__)
|
|
@@ -16,8 +18,8 @@ MODEL_NAME = "davanstrien/Smol-Hub-tldr"
|
|
| 16 |
model = None
|
| 17 |
tokenizer = None
|
| 18 |
device = None
|
| 19 |
-
|
| 20 |
-
|
| 21 |
|
| 22 |
def load_model():
|
| 23 |
global model, tokenizer, device
|
|
@@ -87,9 +89,9 @@ def _generate_summary_gpu(card_text: str, card_type: str) -> str:
|
|
| 87 |
|
| 88 |
return summary
|
| 89 |
|
| 90 |
-
@
|
| 91 |
def generate_summary(card_text: str, card_type: str) -> str:
|
| 92 |
-
"""Cached wrapper for generate_summary."""
|
| 93 |
return _generate_summary_gpu(card_text, card_type)
|
| 94 |
|
| 95 |
def summarize(hub_id: str = "", card_type: str = "model", content: str = "") -> str:
|
|
|
|
| 6 |
from typing import Tuple, Literal
|
| 7 |
import functools
|
| 8 |
import spaces
|
| 9 |
+
from cachetools import TTLCache
|
| 10 |
+
from cachetools.func import ttl_cache
|
| 11 |
+
import time
|
| 12 |
# Set up logging
|
| 13 |
logging.basicConfig(level=logging.INFO)
|
| 14 |
logger = logging.getLogger(__name__)
|
|
|
|
| 18 |
model = None
|
| 19 |
tokenizer = None
|
| 20 |
device = None
|
| 21 |
+
CACHE_TTL = 6 * 60 * 60 # 6 hours in seconds
|
| 22 |
+
CACHE_MAXSIZE = 100
|
| 23 |
|
| 24 |
def load_model():
|
| 25 |
global model, tokenizer, device
|
|
|
|
| 89 |
|
| 90 |
return summary
|
| 91 |
|
| 92 |
+
@ttl_cache(maxsize=CACHE_MAXSIZE, ttl=CACHE_TTL)
|
| 93 |
def generate_summary(card_text: str, card_type: str) -> str:
|
| 94 |
+
"""Cached wrapper for _generate_summary_gpu with TTL."""
|
| 95 |
return _generate_summary_gpu(card_text, card_type)
|
| 96 |
|
| 97 |
def summarize(hub_id: str = "", card_type: str = "model", content: str = "") -> str:
|