UNPKG

html-metadata

Version:

Scrapes metadata of several different standards

97 lines (79 loc) 4.09 kB
<html> <head> <!-- Test fixture: this file contains entirely invalid metadata and should cause parseAll to fail. The JSON-LD block is not valid JSON, and every meta/link value attribute is deliberately misnamed with a "bad" prefix (badcontent, badhref, badtype, badsize). Do not correct the markup. --> <title></title> </head> <body> <script type="application/ld+json"> { "@context" / "http://schema.org", "@type": "Organization" "url": "https://www.turtles.com" } </script> <meta name="author" badcontent="Turtle Lvr"> <meta name="robots" badcontent="we welcome our robot overlords"/> <meta name="description" badcontent="Exposition on the awesomeness of turtles"/> <meta name="keywords" badcontent="turtle, movie" /> <link rel="apple-touch-icon" badhref="movieturtleapple.png"> <link rel="icon" badhref="movieturtle.png" badtype="image/png"> <link rel="apple-touch-icon" badhref="movieturtleapple2.png" badsize"72x72"> <link rel="icon" badhref="movieturtle2.png" badsize="18x18"> <link rel="canonical" badhref="http://example.com/turtles" /> <link rel="publisher" badhref="https://mediawiki.org"/> <link rel="author" badhref="http://examples.com/turtlelvr"/> <link rel="shortlink" badhref="http://example.com/c" /> <!--Open Graph--> <meta property="og:locale" badcontent="en_US" /> <meta property="og:type" badcontent="video.movie" /> <meta property="og:title" badcontent="Turtles of the Jungle" /> <meta property="og:description" badcontent="A 2008 film about jungle turtles." 
/> <meta property="og:url" badcontent="http://example.com" /> <meta property="og:site_name" badcontent="Awesome Turtle Movies Website" /> <meta property="og:image" badcontent="http://example.com/turtle.jpg" /> <meta property="og:image" badcontent="http://example.com/shell.jpg" /> <meta property="video:tag" badcontent="turtle" /> <meta property="video:tag" badcontent="movie" /> <meta property="video:tag" badcontent="awesome" /> <meta property="video:director" badcontent="http://www.example.com/PhilTheTurtle" /> <meta property="video:actor" badcontent="http://www.example.com/PatTheTurtle" /> <meta property="video:actor:role" badcontent="Turtle #3" /> <!-- Currently ignored --> <meta property="video:actor" badcontent="http://www.example.com/SaminaTheTurtle" /> <meta property="video:writer" badcontent="http://www.example.com/TinaTheTurtle" /> <meta property="video:release_date" badcontent="2015-01-14T19:14:27+00:00" /> <meta property="video:duration" badcontent="1000000" /> <!--AL--> <meta property="al:ios:url" badcontent="turtle://"> <meta property="al:ios:app_store_id" badcontent="000"> <meta property="al:android:url" badcontent="turtle://"> <meta property="al:android:package" badcontent="superturtlearticle.androidapp"> <meta property="al:web:url" badcontent="http://example.com/"> <meta property="al:web:should_fallback" badcontent="true"> <!--Twitter--> <meta name="twitter:card" badcontent="summary"> <meta name="twitter:site" badcontent="@Turtlessssssssss"> <meta name="twitter:creator" badcontent="@Turtlessssssssss"> <meta name="twitter:url" badcontent="http://www.example.com/turtles"> <meta name="twitter:title" badcontent="Turtles of the Jungle"> <meta name="twitter:description" badcontent="A 2008 film about jungle turtles."> <meta name="twitter:player" badcontent="http://www.example.com/turtles/player"> <meta name="twitter:player:width" badcontent="400"> <meta name="twitter:player:height" badcontent="400"> <meta name="twitter:player:stream" 
badcontent="http://www.example.com/turtles/turtle.mp4"> <meta name="twitter:player:stream:badcontent_type" badcontent="video/mp4"> <!--Dublin Core--> <meta name="DC.Title" badcontent="Turtles of the Jungle" > <meta name="DC.Creator" badcontent="http://www.example.com/turtlelvr" > <meta name="DC.Description" badcontent="A 2008 film about jungle turtles." > <meta name="DC.Date" badcontent="2012-02-04 12:00:00" > <meta name="DC.Type" badcontent="Image.Moving" > <!--PRISM--> <meta name="prism.publicationName" badcontent="Turtles of the Jungle" > <meta name="prism.publicationDate" badcontent="2012-02-04" > <meta name="prism.copyright" badcontent="2012 Turtles Society" > <meta name="prism.rightsAgent" badcontent="permissions@turtles.com" > <meta name="prism.url" badcontent="https://www.turtles.com" > </body> </html>