<html>
<!--
  Test fixture for WebPageSerializer::retrieveAllResources: it is used to
  check that the expected resources are correctly retrieved from various
  HTML nodes.

  NOTE(review): every URL and attribute below is fixture data and is kept
  exactly as originally written (odd spellings and the upper-case CITE
  included). Presumably the test matches on these values; confirm against
  the test before "fixing" any of them.
-->

<head>
  <!-- Style sheet links should be retrieved. -->
  <link rel="stylesheet" type="text/css" href="http://www.example.com/beautifull.css">
  <!-- Any other kind of link should NOT be retrieved. -->
  <link rel="copyright" type="text/plain" href="http://www.example.com/copyright">
  <!-- Scripts should be retrieved. -->
  <script src="awesome.js"></script>
</head>

<!-- Images are always retrieved. -->
<body background="bodyBackground.jpg">

  <!-- Same image twice, to make sure each resource is only reported once. -->
  <img src="awesome.png">
  <img src="awesome.png">

  <form>
    <input type="image" src="imageButton.png">
  </form>

  <!-- Both rows reference the same row and cell background images. -->
  <table background="tableBackground.png">
    <tr background="trBackground.png">
      <td background="tdBackground.png"></td>
    </tr>
    <tr background="trBackground.png">
      <td background="tdBackground.png"></td>
    </tr>
  </table>

  <!-- Some more obscure tags. -->
  <blockquote cite="http://www.evene.fr/citations/auteur.php?ida=46"></blockquote>
  <q CITE="http://www.brainyquote.com/quotes/authors/c/charles_darwin.html"></q>
  <p>My favorite color is <del cite="why_deleted.html">blue</del> <ins>red</ins>!</p>
  <p>My favorite color is <del>blue</del> <ins cite="why_inserted.html">red</ins>!</p>

  <!-- Make sure we only retrieve URLs with the right schemes. -->
  <img src="https://www.secure.com/https.gif"> <!-- HTTPS is OK -->
  <img src="file://c/my_folder/file.gif"> <!-- file is OK -->
  <img src="ftp://ftp.com/ftp.gif"> <!-- FTP is not OK -->
  <img src="unknown://unkown.com/unknown.gif"> <!-- Unknown schemes are not OK -->

</body>

</html>