/* Parses a Google Movies web page (previously downloaded to a file)
 * using libxml2. Examples of Google Movies web pages can be
 * found in the gmovies_data directory.
 */
#include <stdio.h>

#include <libxml/HTMLparser.h>
#include <libxml/tree.h>
11 int main (int argc, char ** argv)
15 printf("usage: gmovies file.html\n");
19 htmlDocPtr doc = htmlReadFile(argv[1], "UTF-8", 0);
21 xmlNodePtr root = xmlDocGetRootElement(doc);//html
23 xmlNodePtr body = xmlLastElementChild(root);//body
25 xmlNodePtr elem = xmlFirstElementChild(body);
28 elem = xmlNextElementSibling(elem);
32 elem = xmlFirstElementChild(elem); //tr
33 elem = xmlFirstElementChild(elem); //td
34 elem = xmlFirstElementChild(elem); //a
35 elem = xmlFirstElementChild(elem); //b
37 printf("First theater = %s\n", xmlNodeGetContent(elem));