unfluff
Version:
A web page content extractor
12 lines • 600 B
JSON
{
"url": "http://www.tulsaworld.com/site/articlepath.aspx?articleid=20111118_61_A16_Opposi344152&rss_lnk=7",
"expected": {
"meta_description": "",
"domain": "www.tulsaworld.com",
"final_url": "http://www.tulsaworld.com/site/articlepath.aspx?articleid=20111118_61_A16_Opposi344152&rss_lnk=7",
"meta_keywords": "COURT RULE INFORMATION RECORDS DISTRICT OKLAHOMA PERSONAL PROPOSAL PROPOSED REASONS",
"cleaned_text": "Opposition to a proposal to remove certain personal data",
"meta_favicon": "/favicon.ico",
"meta_lang": null
}
}