/**
 * Extracts the title from HTML content if available.
 *
 * Type declaration only; the implementation is not part of this file.
 * NOTE(review): which markup is treated as the title (for example a
 * `<title>` element or a heading) is not visible here; confirm against the
 * implementation before relying on it.
 *
 * @param htmlContent The HTML content to search, passed as a string
 * @returns The extracted title, or `undefined` when no title is available
 */
export declare function extractTitleFromHTML(htmlContent: string): string | undefined;
/**
 * Looks for potential image URLs in the HTML content and returns the first
 * one found.
 *
 * Type declaration only; the implementation is not part of this file.
 * NOTE(review): what qualifies as a "potential" image URL (attributes
 * inspected, accepted file extensions, relative vs. absolute URLs) is not
 * visible here; confirm against the implementation.
 *
 * @param htmlContent The HTML content to search, passed as a string
 * @returns The first potential image URL, or `undefined` when none is found
 */
export declare function extractImageFromHTML(htmlContent: string): string | undefined;
/**
 * Cleans and normalizes text based on its detected language.
 *
 * Type declaration only; the implementation is not part of this file.
 * NOTE(review): how the language is detected and which normalization steps
 * are applied per language are not visible here; confirm against the
 * implementation.
 *
 * @param text The text to clean
 * @returns The cleaned text; always a string, never `undefined`
 */
export declare function cleanText(text: string): string;
/**
 * Applies Arabic-specific text sanitization.
 *
 * Type declaration only; the implementation is not part of this file.
 * NOTE(review): the concrete sanitization steps, and the behaviour when the
 * input is not Arabic, are not visible here; confirm against the
 * implementation.
 *
 * @param text The Arabic text to sanitize
 * @returns The sanitized text
 */
export declare function sanitizeArabicText(text: string): string;
/**
 * Extracts sentences from text.
 *
 * Type declaration only; the implementation is not part of this file.
 * NOTE(review): the rules used to detect sentence boundaries, and the result
 * for empty input (presumably an empty array), are not visible here; confirm
 * against the implementation.
 *
 * @param text The text to extract sentences from
 * @returns An array of sentences
 */
export declare function extractSentences(text: string): string[];
