feat(backend): add TfL disruptions API with Gemini AI shortening
- Add TfL Unified API integration for real-time transport disruptions
- Implement batch AI shortening using Gemini 2.5 Flash-Lite
- Add in-memory caching with 1-hour TTL
- Support Tube, Overground, DLR, Elizabeth Line, and Tram
- Sort disruptions by severity with regex-based line name cleanup

Co-authored-by: Ona <no-reply@ona.com>
This commit is contained in:
204
apps/backend/src/tfl/gemini.ts
Normal file
204
apps/backend/src/tfl/gemini.ts
Normal file
@@ -0,0 +1,204 @@
|
||||
/**
|
||||
* Gemini AI integration for shortening TfL disruption descriptions
|
||||
*/
|
||||
|
||||
import { getCachedShortened, setCachedShortened } from "./cache"
|
||||
|
||||
/**
 * One disruption whose description is a candidate for shortening.
 */
interface DisruptionToShorten {
  /** Line name; used as the key of the result map and stripped from the start of `reason`. */
  lineName: string
  /** Status text; passed to the model in the batch prompt as "Status". */
  status: string
  /** Full disruption description to be shortened. */
  reason: string
}
|
||||
|
||||
/**
 * Shape of one element of the JSON array the model is asked to return.
 */
interface ShortenedResult {
  /** Line name the shortened text belongs to. */
  lineName: string
  /** Shortened disruption message for that line. */
  shortened: string
}
|
||||
|
||||
/**
 * Strip a leading line-name prefix from a disruption description.
 *
 * Removes a prefix of the form "<name>:" or "<name> Line:" (matched
 * case-insensitively, e.g. "Central Line:", "CENTRAL LINE:", "Mildmay Line:")
 * from the start of `text`. Text that does not start with the line name is
 * returned unchanged apart from trimming.
 *
 * @param text - Disruption description, possibly prefixed with the line name.
 * @param lineName - Line name to remove; regex metacharacters are escaped.
 * @returns The description without the prefix, trimmed of surrounding whitespace.
 */
function stripLineName(text: string, lineName: string): string {
  const name = lineName.trim()

  // Without a name there is no prefix to remove. Building the pattern anyway
  // would degenerate to /^\s*Line:/ or /^:/ and strip unrelated leading text.
  if (name === "") {
    return text.trim()
  }

  // Escape special regex characters in line name
  const escapedName = name.replace(/[.*+?^${}()|[\]\\]/g, "\\$&")

  // A single case-insensitive pattern covers "<name>:", "<name> Line:" and
  // "<NAME> LINE:"; it is anchored so only a leading prefix is removed.
  const prefixPattern = new RegExp(`^\\s*${escapedName}(?:\\s*Line)?\\s*:\\s*`, "i")

  return text.replace(prefixPattern, "").trim()
}
|
||||
|
||||
/**
 * Shorten multiple disruption reasons in a single Gemini API call.
 *
 * Each disruption is resolved in this order:
 * 1. a cached value stored under its raw `reason`,
 * 2. its prefix-stripped text, when that is already under 80 characters,
 * 3. the shortened text returned by Gemini.
 *
 * Any disruption Gemini does not answer (missing API key, HTTP error, network
 * error, unparseable or incomplete response) falls back to its prefix-stripped
 * text, so every input line name ends up with an entry.
 *
 * @param disruptions - Disruptions to shorten.
 * @returns Map from `lineName` to display text. The map is keyed by line name,
 *   so if several inputs share a `lineName` only one entry survives.
 */
export async function shortenMultipleDisruptions(
  disruptions: DisruptionToShorten[]
): Promise<Map<string, string>> {
  const apiKey = process.env.GEMINI_API_KEY
  const results = new Map<string, string>()

  if (!apiKey) {
    console.warn("GEMINI_API_KEY not set, returning stripped versions")
    for (const disruption of disruptions) {
      results.set(disruption.lineName, stripLineName(disruption.reason, disruption.lineName))
    }
    return results
  }

  // Texts shorter than this are displayed as-is without calling Gemini
  const maxDisplayLength = 80

  // Disruptions that still need Gemini; `reason` holds the prefix-stripped text
  const toShorten: DisruptionToShorten[] = []
  // Raw (unstripped) reason per line. The cache is always looked up by the raw
  // reason, so Gemini results must be stored under that same key.
  const rawReasonByLine = new Map<string, string>()

  for (const disruption of disruptions) {
    // Check cache first
    const cached = getCachedShortened(disruption.reason)
    if (cached) {
      results.set(disruption.lineName, cached)
      continue
    }

    const stripped = stripLineName(disruption.reason, disruption.lineName)

    // If already short after stripping, use that
    if (stripped.length < maxDisplayLength) {
      results.set(disruption.lineName, stripped)
      setCachedShortened(disruption.reason, stripped)
      continue
    }

    // Needs shortening
    toShorten.push({ ...disruption, reason: stripped })
    if (!rawReasonByLine.has(disruption.lineName)) {
      rawReasonByLine.set(disruption.lineName, disruption.reason)
    }
  }

  // If nothing needs shortening, return early
  if (toShorten.length === 0) {
    return results
  }

  // Line names for which Gemini returned a usable shortened message
  const answered = new Set<string>()

  try {
    const response = await fetch(
      "https://generativelanguage.googleapis.com/v1beta/models/gemini-2.5-flash-lite:generateContent",
      {
        method: "POST",
        headers: {
          "Content-Type": "application/json",
          // Send the key as a header rather than in the query string so it does
          // not end up in URLs that get logged.
          "x-goog-api-key": apiKey,
        },
        body: JSON.stringify({
          contents: [
            {
              parts: [
                {
                  text: buildBatchShorteningPrompt(toShorten),
                },
              ],
            },
          ],
          generationConfig: {
            temperature: 0.3,
            maxOutputTokens: 2000, // Higher limit to leave headroom for thinking tokens on Gemini 2.5 models
            topP: 0.9,
          },
        }),
      }
    )

    if (response.ok) {
      const data = (await response.json()) as GeminiGenerateContentResponse
      const responseText = data.candidates?.[0]?.content?.parts?.[0]?.text?.trim() ?? ""

      try {
        const parsed: unknown = JSON.parse(extractJsonArrayText(responseText))
        if (!Array.isArray(parsed)) {
          throw new Error("Gemini response is not a JSON array")
        }

        for (const item of parsed) {
          if (!isShortenedResult(item) || item.shortened.trim() === "") {
            continue
          }
          // Ignore line names that were not part of the request (e.g. renamed
          // by the model); the requested line falls back to its stripped text.
          const rawReason = rawReasonByLine.get(item.lineName)
          if (rawReason === undefined) {
            continue
          }
          results.set(item.lineName, item.shortened)
          setCachedShortened(rawReason, item.shortened)
          answered.add(item.lineName)
        }
      } catch (parseError) {
        console.error("Failed to parse Gemini JSON response:", parseError)
        console.error("Response was:", responseText)
      }
    } else {
      console.error(`Gemini API error: ${response.status}`)
    }
  } catch (error) {
    console.error("Failed to shorten disruptions:", error)
  }

  // Fallback to stripped versions for everything Gemini did not answer
  for (const disruption of toShorten) {
    if (!answered.has(disruption.lineName)) {
      results.set(disruption.lineName, disruption.reason)
    }
  }

  return results
}

/**
 * Minimal shape of the parts of a Gemini `generateContent` response read here.
 */
interface GeminiGenerateContentResponse {
  candidates?: Array<{
    content?: {
      parts?: Array<{ text?: string }>
    }
  }>
}

/**
 * Extract the JSON payload from the model's text: the contents of a markdown
 * code fence if present, otherwise the outermost "[...]" span, otherwise the
 * text unchanged.
 */
function extractJsonArrayText(responseText: string): string {
  const fenced = responseText.match(/```(?:json)?\s*([\s\S]*?)\s*```/i)
  if (fenced?.[1] !== undefined) {
    return fenced[1]
  }

  const start = responseText.indexOf("[")
  const end = responseText.lastIndexOf("]")
  return start !== -1 && end > start ? responseText.slice(start, end + 1) : responseText
}

/**
 * Runtime check that a parsed JSON value has string `lineName` and `shortened` fields.
 */
function isShortenedResult(value: unknown): value is ShortenedResult {
  if (typeof value !== "object" || value === null) {
    return false
  }
  const candidate = value as Record<string, unknown>
  return typeof candidate.lineName === "string" && typeof candidate.shortened === "string"
}
|
||||
|
||||
/**
 * Assembles the single prompt sent to Gemini for a batch of disruptions.
 *
 * The prompt lists every disruption (numbered from 1, with line, status and
 * message), states the shortening requirements, and asks for a JSON array of
 * `{"lineName", "shortened"}` objects.
 *
 * @param disruptions - Disruptions to include in the prompt.
 * @returns The complete prompt text.
 */
function buildBatchShorteningPrompt(disruptions: DisruptionToShorten[]): string {
  // One numbered entry per disruption, separated by a blank line
  const entries: string[] = []
  disruptions.forEach((disruption, index) => {
    entries.push(
      `${index + 1}. Line: ${disruption.lineName}\n Status: ${disruption.status}\n Message: "${disruption.reason}"`
    )
  })

  const promptLines = [
    "Shorten these London transport disruption messages for a dashboard display. Return your response as a JSON array.",
    "",
    "Disruptions to shorten:",
    entries.join("\n\n"),
    "",
    "Requirements:",
    "- Keep each shortened message under 80 characters",
    "- Be concise but keep essential information (reason, locations, alternatives, time info)",
    "- DO NOT include line names in the shortened text (they're displayed separately)",
    "- Use natural, clear language",
    "- NO emojis",
    "",
    "Return ONLY a JSON array in this exact format:",
    "[",
    `{"lineName": "Piccadilly", "shortened": "Suspended Rayners Lane-Uxbridge until Fri due to Storm Benjamin. Use Metropolitan line."},`,
    `{"lineName": "Central", "shortened": "Minor delays due to train cancellations"},`,
    "...",
    "]",
    "",
    "Good examples of shortened messages:",
    `- "Suspended Rayners Lane-Uxbridge until Fri due to Storm Benjamin. Use Metropolitan line."`,
    `- "Minor delays due to train cancellations"`,
    `- "Minor delays due to earlier incidents at Gospel Oak & Highbury"`,
    `- "Severe delays - signal failure at King's Cross. Use buses/Elizabeth line."`,
    `- "No service Earls Court-Wimbledon until Sun 27 Oct (engineering)"`,
    "",
    "Generate JSON array:",
  ]

  return promptLines.join("\n")
}
|
||||
|
||||
|
||||
Reference in New Issue
Block a user