/* This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see https://www.gnu.org/licenses/. © 2021 dogeystamp */ #include #include #include #include #include #include #include #include "util.h" #include "xml.h" #define TAGIS(X, Y) (!xmlStrcmp(X->name, (const xmlChar *) Y)) void freeItem(itemStruct *item) { // Free the memory used by an article. char **mems[] = { &item->title, &item->link, &item->description, }; for (unsigned long int i = 0; i < LEN(mems); i++) { if (*mems[i]) free(*mems[i]); } free(item); } static int parseXml(xmlDocPtr doc, const char *feedName, void itemAction(itemStruct *, const char *)) { // Parse the XML in a single document. if (!feedName || !feedName[0]) { logMsg(1, "Missing feed name, please set one.\n"); return 1; } xmlNodePtr rootNode; rootNode = xmlDocGetRootElement(doc); if (!rootNode) { logMsg(1, "Empty document for feed.\n"); return 1; } enum feedFormat format = none; if (TAGIS(rootNode, "rss")) { format = rss; } else if (TAGIS(rootNode, "feed")) { if (!xmlStrcmp(rootNode->ns->href, (const xmlChar *) "http://www.w3.org/2005/Atom")) format = atom; } if (format == none) { logMsg(1, "XML document is not an RSS or Atom feed.\n"); return 1; } // Pointer to the first child of the root XML node xmlNodePtr cur = rootNode->children; switch (format) { case rss: // Get channel XML tag while(cur && !TAGIS(cur, "channel")) cur = cur->next; if (!cur || !TAGIS(cur, "channel")) { logMsg(1, "Invalid RSS syntax.\n"); return 1; } // Set cur to child of channel cur = cur->children; break; case atom: // Set cur to child of feed cur = rootNode->children; break; default: logMsg(1, "Missing starting tag for format\n"); return 1; } // Previous item (to build a linked list later) itemStruct *prev = NULL; // Loop over articles (skipping non-article tags) while (cur) { short isArticle = 0; switch (format) { case rss: isArticle = TAGIS(cur, "item"); break; case atom: isArticle = TAGIS(cur, "entry"); break; default: logMsg(1, "Missing article tag name for format\n"); return 1; } if (isArticle) { itemStruct *item = ecalloc(1, sizeof(itemStruct)); // The selected set of attribute keys char **attKeys; // Struct variables to map attributes to char **atts[] = { &item->title, &item->link, &item->description, }; // Attribute keys for each format char *attKeysRss[LEN(atts)] = { "title", "link", "description", }; char *attKeysAtom[LEN(atts)] = { "title", // link has special treatment because its value is in href not within the tag "", "content", }; switch (format) { case rss: attKeys = attKeysRss; break; case atom: attKeys = attKeysAtom; break; default: logMsg(1, "Missing article attribute keys for format\n"); return 1; }; // Build a linked list of item structs to pass to itemAction() item->next = prev; prev = item; xmlNodePtr itemNode = cur->children; // Value within the tag char *itemKey; while (itemNode) { itemKey = (char *)xmlNodeListGetString(doc, itemNode->children, 1); if (itemKey) { for (unsigned long int i = 0; i < LEN(atts); i++) { if (TAGIS(itemNode, attKeys[i])) { size_t keyLen = strlen(itemKey) + 1; *atts[i] = ecalloc(keyLen, sizeof(char)); memcpy(*atts[i], itemKey, keyLen * sizeof(char)); break; } } xmlFree(itemKey); } // Exceptions // Atom entry link tag if (format == atom && TAGIS(itemNode, "link")) { xmlChar *link = xmlGetProp(itemNode, (xmlChar *) "href"); if (!link) { logMsg(1, "Missing Atom entry link\n"); xmlFree(link); return 1; } size_t linkLen = strlen((char *) link) + 1; item->link = ecalloc(linkLen, sizeof(char)); memcpy(item->link, (char *) link, linkLen * sizeof(char)); xmlFree(link); } itemNode = itemNode->next; } } cur = cur->next; } errno = 0; int stat = mkdir((const char* ) feedName, S_IRWXU); if (!stat && errno && errno != EEXIST) { logMsg(1, "Error creating directory for feed.\n"); return 1; } itemAction(prev, feedName); return 0; } int readDoc(char *content, const char *feedName, void itemAction(itemStruct *, const char *)) { // Initialize the XML document, read it, then free it xmlDocPtr doc; doc = xmlReadMemory(content, strlen(content), "noname.xml", NULL, 0); if (!doc) { logMsg(1, "XML parser error.\n"); return 1; } int stat = parseXml(doc, feedName, itemAction); if (stat) logMsg(1, "Skipped feed %s due to errors.\n", feedName); xmlFreeDoc(doc); return stat; }