unfluff
Version:
A web page content extractor
20 lines (19 loc) • 1 kB
JSON
{
"url": "http://www.aolnews.com/nation/article/the-few-the-proud-the-marines-getting-a-makeover/19592478",
"expected": {
"meta_description": "(Aug. 13) -- Declaring",
"domain": "www.aolnews.com",
"final_url": "http://www.aolnews.com/nation/article/the-few-the-proud-the-marines-getting-a-makeover/19592478",
"meta_keywords": "news, update, breaking, nation, U.S., elections, world, entertainment, sports, business, weird news, health, science, latest news articles, breaking news, current news, top news",
"cleaned_text": "WASHINGTON (Aug. 13) -- Declaring \"the maritime soul of the Marine Corps\" is",
"tags": [
"Defense Secretary Robert Gates",
"military",
"Marines",
"armed forces"
],
"meta_favicon": "http://o.aolcdn.com/art/ch_news/aol_favicon.ico",
"meta_lang": "en",
"image": "http://o.aolcdn.com/photo-hub/news_gallery/6/8/680919/1281734929876.JPEG "
}
}