html-metadata
Version:
Scrapes metadata of several different standards
97 lines (79 loc) • 4.09 kB
HTML
<html>
<head>
<!--
This file contains entirely invalid metadata and should cause parseAll to fail.
It is a negative-test fixture: the malformed markup in this document is intentional
and must be kept exactly as written.
-->
<!-- Empty title: presumably deliberate, so that no title can be extracted (confirm against the test that loads this file) -->
<title></title>
</head>
<body>
<!--JSON-LD: the object in this script is not valid JSON ("/" is used where ":" belongs after "@context", and there is no comma after the "@type" member)-->
<script type="application/ld+json">
{
"@context" / "http://schema.org",
"@type": "Organization"
"url": "https://www.turtles.com"
}
</script>
<!--General: named meta tags and link relations; values sit in "bad"-prefixed attributes (badcontent, badhref, badtype, badsize), so none of these tags has a content or href attribute-->
<meta name="author" badcontent="Turtle Lvr">
<meta name="robots" badcontent="we welcome our robot overlords"/>
<meta name="description" badcontent="Exposition on the awesomeness of turtles"/>
<meta name="keywords" badcontent="turtle, movie" />
<link rel="apple-touch-icon" badhref="movieturtleapple.png">
<link rel="icon" badhref="movieturtle.png" badtype="image/png">
<!-- NOTE(review): the next link writes badsize"72x72" with no "=" sign; unclear whether that is deliberate or a typo, confirm before touching it -->
<link rel="apple-touch-icon" badhref="movieturtleapple2.png" badsize"72x72">
<link rel="icon" badhref="movieturtle2.png" badsize="18x18">
<link rel="canonical" badhref="http://example.com/turtles" />
<link rel="publisher" badhref="https://mediawiki.org"/>
<link rel="author" badhref="http://examples.com/turtlelvr"/>
<link rel="shortlink" badhref="http://example.com/c" />
<!--Open Graph: og:* and video:* properties; every value is carried in "badcontent" rather than "content", so no tag here has a content attribute-->
<meta property="og:locale" badcontent="en_US" />
<meta property="og:type" badcontent="video.movie" />
<meta property="og:title" badcontent="Turtles of the Jungle" />
<meta property="og:description" badcontent="A 2008 film about jungle turtles." />
<meta property="og:url" badcontent="http://example.com" />
<meta property="og:site_name" badcontent="Awesome Turtle Movies Website" />
<meta property="og:image" badcontent="http://example.com/turtle.jpg" />
<meta property="og:image" badcontent="http://example.com/shell.jpg" />
<meta property="video:tag" badcontent="turtle" />
<meta property="video:tag" badcontent="movie" />
<meta property="video:tag" badcontent="awesome" />
<meta property="video:director" badcontent="http://www.example.com/PhilTheTurtle" />
<meta property="video:actor" badcontent="http://www.example.com/PatTheTurtle" />
<meta property="video:actor:role" badcontent="Turtle #3" /> <!-- Currently ignored -->
<meta property="video:actor" badcontent="http://www.example.com/SaminaTheTurtle" />
<meta property="video:writer" badcontent="http://www.example.com/TinaTheTurtle" />
<meta property="video:release_date" badcontent="2015-01-14T19:14:27+00:00" />
<meta property="video:duration" badcontent="1000000" />
<!--AL: al:* properties (presumably App Links; confirm); every value is carried in "badcontent" rather than "content"-->
<meta property="al:ios:url" badcontent="turtle://">
<meta property="al:ios:app_store_id" badcontent="000">
<meta property="al:android:url" badcontent="turtle://">
<meta property="al:android:package" badcontent="superturtlearticle.androidapp">
<meta property="al:web:url" badcontent="http://example.com/">
<meta property="al:web:should_fallback" badcontent="true">
<!--Twitter: twitter:* named meta tags; every value is carried in "badcontent" rather than "content"-->
<meta name="twitter:card" badcontent="summary">
<meta name="twitter:site" badcontent="@Turtlessssssssss">
<meta name="twitter:creator" badcontent="@Turtlessssssssss">
<meta name="twitter:url" badcontent="http://www.example.com/turtles">
<meta name="twitter:title" badcontent="Turtles of the Jungle">
<meta name="twitter:description" badcontent="A 2008 film about jungle turtles.">
<meta name="twitter:player" badcontent="http://www.example.com/turtles/player">
<meta name="twitter:player:width" badcontent="400">
<meta name="twitter:player:height" badcontent="400">
<meta name="twitter:player:stream" badcontent="http://www.example.com/turtles/turtle.mp4">
<!-- NOTE(review): in the next tag the name itself ends in "badcontent_type", not only the attribute; possibly a side effect of a content-to-badcontent replacement, confirm whether it is intended -->
<meta name="twitter:player:stream:badcontent_type" badcontent="video/mp4">
<!--Dublin Core: DC.* named meta tags; every value is carried in "badcontent" rather than "content"-->
<meta name="DC.Title" badcontent="Turtles of the Jungle" >
<meta name="DC.Creator" badcontent="http://www.example.com/turtlelvr" >
<meta name="DC.Description" badcontent="A 2008 film about jungle turtles." >
<meta name="DC.Date" badcontent="2012-02-04 12:00:00" >
<meta name="DC.Type" badcontent="Image.Moving" >
<!--PRISM: prism.* named meta tags; every value is carried in "badcontent" rather than "content"-->
<meta name="prism.publicationName" badcontent="Turtles of the Jungle" >
<meta name="prism.publicationDate" badcontent="2012-02-04" >
<meta name="prism.copyright" badcontent="2012 Turtles Society" >
<meta name="prism.rightsAgent" badcontent="permissions@turtles.com" >
<meta name="prism.url" badcontent="https://www.turtles.com" >
</body>
</html>