/* This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see https://www.gnu.org/licenses/. © 2021 dogeystamp */ #include #include #include #include #include #include #include #include #include #include #include "util.h" #include "net.h" #include "handlers.h" #include "config.h" #define TAGIS(X, Y) (!xmlStrcmp(X->name, (const xmlChar *) Y)) static int parseXml(xmlDocPtr doc, const char *feedName, void itemAction(itemStruct *, const char *)) { // Parse the XML in a single document. if (!feedName || !feedName[0]) { logMsg(1, "Missing feed name, please set one.\n"); return 1; } xmlNodePtr rootNode; rootNode = xmlDocGetRootElement(doc); if (!rootNode) { logMsg(1, "Empty document for feed.\n"); return 1; } enum feedFormat format = NONE; if (TAGIS(rootNode, "rss")) { format = RSS; } else if (TAGIS(rootNode, "feed")) { if (!xmlStrcmp(rootNode->ns->href, (const xmlChar *) "http://www.w3.org/2005/Atom")) format = ATOM; } if (format == NONE) { logMsg(1, "XML document is not an RSS or Atom feed.\n"); return 1; } // Pointer to the first child of the root XML node xmlNodePtr cur = rootNode->children; switch (format) { case RSS: // Get channel XML tag while(cur && !TAGIS(cur, "channel")) cur = cur->next; if (!cur || !TAGIS(cur, "channel")) { logMsg(1, "Invalid RSS syntax.\n"); return 1; } // Set cur to child of channel cur = cur->children; break; case ATOM: // Set cur to child of feed cur = rootNode->children; break; default: logMsg(1, "Missing starting tag for format\n"); return 1; } // Previous item (to build a linked list later) itemStruct *prev = NULL; // Loop over articles (skipping non-article tags) while (cur) { short isArticle = 0; switch (format) { case RSS: isArticle = TAGIS(cur, "item"); break; case ATOM: isArticle = TAGIS(cur, "entry"); break; default: logMsg(1, "Missing article tag name for format\n"); return 1; } if (isArticle) { itemStruct *item = ecalloc(1, sizeof(itemStruct)); // Build a linked list of item structs to pass to itemAction() item->next = prev; prev = item; xmlNodePtr itemNode = cur->children; // Value within the tag char *itemKey; while (itemNode) { itemKey = (char *)xmlNodeListGetString(doc, itemNode->children, 1); switch (format) { case RSS: if TAGIS(itemNode, "link") copyField(item, FIELD_LINK, itemKey); else if TAGIS(itemNode, "description") copyField(item, FIELD_DESCRIPTION, itemKey); else if TAGIS(itemNode, "title") copyField(item, FIELD_TITLE, itemKey); else if TAGIS(itemNode, "enclosure") rssEnclosure(item, itemNode); break; case ATOM: if TAGIS(itemNode, "link") atomLink(item, itemNode); else if TAGIS(itemNode, "content") copyField(item, FIELD_DESCRIPTION, itemKey); else if TAGIS(itemNode, "title") copyField(item, FIELD_TITLE, itemKey); break; default: break; } xmlFree(itemKey); itemNode = itemNode->next; } } cur = cur->next; } errno = 0; int stat = mkdir((const char* ) feedName, S_IRWXU); if (!stat && errno && errno != EEXIST) { logMsg(1, "Error creating directory for feed.\n"); return 1; } itemAction(prev, feedName); return 0; } int readDoc(char *content, const char *feedName, void itemAction(itemStruct *, const char *)) { // Initialize the XML document, read it, then free it xmlDocPtr doc; doc = xmlReadMemory(content, strlen(content), "noname.xml", NULL, 0); if (!doc) { logMsg(1, "XML parser error.\n"); return 1; } int stat = parseXml(doc, feedName, itemAction); if (stat) logMsg(1, "Skipped feed %s due to errors.\n", feedName); xmlFreeDoc(doc); return stat; } int main(int argc, char *argv[]) { if (argc == 2 && !strcmp("-v", argv[1])) logMsg(0, "MinRSS %s\n", VERSION); else if (argc != 1) logMsg(0, "Usage: minrss [-v]\n"); unsigned int i = 0; initCurl(); outputStruct outputs[LEN(links)]; memset(outputs, 0, sizeof(outputs)); for (i = 0; i < LEN(links); i++) { if (links[0].url[0] == '\0') logMsg(0, "No feeds, add them in config.def.h\n"); logMsg(4, "Requesting %s\n", links[i].url); createRequest(links[i].url, &outputs[i]); } performRequests(finish); logMsg(3, "Finished downloads.\n"); for (i = 0; i < LEN(links); i++) { logMsg(5, "Parsing %s\n", links[i].url); if (outputs[i].buffer && outputs[i].buffer[0]) { readDoc(outputs[i].buffer, links[i].feedName, itemAction); free(outputs[i].buffer); } } logMsg(3, "Finished parsing feeds.\n"); return 0; }