From 60b4c9e4307647b66b3ecfd911f401162f3e9926 Mon Sep 17 00:00:00 2001 From: makefu Date: Sat, 24 Sep 2022 00:30:52 +0200 Subject: ma rss: rip sofa --- makefu/2configs/deployment/rss/sofa-urls | 1 - makefu/2configs/deployment/rss/sofa.nix | 26 -------------- makefu/2configs/deployment/rss/sofa.yml | 59 -------------------------------- 3 files changed, 86 deletions(-) delete mode 100644 makefu/2configs/deployment/rss/sofa-urls delete mode 100644 makefu/2configs/deployment/rss/sofa.nix delete mode 100644 makefu/2configs/deployment/rss/sofa.yml (limited to 'makefu') diff --git a/makefu/2configs/deployment/rss/sofa-urls b/makefu/2configs/deployment/rss/sofa-urls deleted file mode 100644 index 70a6c321..00000000 --- a/makefu/2configs/deployment/rss/sofa-urls +++ /dev/null @@ -1 +0,0 @@ -https://www.ebay-kleinanzeigen.de/s-ditzingen/preis::50/sofa/k0l8863r10 diff --git a/makefu/2configs/deployment/rss/sofa.nix b/makefu/2configs/deployment/rss/sofa.nix deleted file mode 100644 index b9180fd4..00000000 --- a/makefu/2configs/deployment/rss/sofa.nix +++ /dev/null @@ -1,26 +0,0 @@ -{ pkgs, lib, config, ... }: -let - fqdn = "rss.euer.krebsco.de"; - ratt-path = "/var/lib/ratt/"; - out-path = "${ratt-path}/sofa.xml"; -in { - systemd.tmpfiles.rules = ["d ${ratt-path} 0750 nginx nginx - -" ]; - systemd.services.run-ratt-sofa = { - enable = true; - path = with pkgs; [ ratt xmlstarlet ]; - script = builtins.readFile ./ratt-hourly.sh; - scriptArgs = "${./sofa-urls} ${out-path}"; - - preStart = "install -v -m750 ${./sofa.yml} ${ratt-path}/sofa.yml"; # ratt requires the config file in the cwd - serviceConfig.User = "nginx"; - serviceConfig.WorkingDirectory = ratt-path; - startAt = "00/3:30"; # every 3 hours, fetch latest - }; - - services.nginx.virtualHosts."${fqdn}" = { - locations."=/ratt/sofa.xml" = { - alias = out-path; - }; - }; -} - diff --git a/makefu/2configs/deployment/rss/sofa.yml b/makefu/2configs/deployment/rss/sofa.yml deleted file mode 100644 index 3248f5c4..00000000 --- a/makefu/2configs/deployment/rss/sofa.yml +++ /dev/null @@ -1,59 +0,0 @@ -regex: https://www.ebay\-kleinanzeigen.de/s\-.* -selectors: - httpsettings: - cookie: {} - header: {} - useragent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) - Chrome/90.0.4430.72 Safari/537.36 - insecure: false - feed: - title: title - authorname: "" - authoremail: "" - item: - container: ul[id='srchrslt-adtable'] li[class='ad-listitem lazyload-item '] - title: | - title = sel:find("h2.text-module-begin"):first():text():gsub("^%s*(.-)%s*$", "%1") - print(title) - link: | - link = sel:find("a"):first():attr("href") - print("https://www.ebay-kleinanzeigen.de" .. link) - created: |- - created = "" - sel:find("div.aditem-main--top--right"):each(function(i, s) - created = s:text():gsub("^%s*(.-)%s*$", "%1") - end) - if created:match("Heute") then - time = created:gsub("^.*,", "") - print(os.date("%d.%m.%Y") .. time .. " CET") - return - end - if created:match("Gestern") then - time = created:gsub("^.*,", "") - print(os.date("%d.%m.%Y", os.time()-24*60*60) .. time .. " CET") - return - end - if created:match("\.") then - print(created .. " 00:00 CET") - return - end - createdformat: 02.01.2006 15:04 MST - description: |- - description = sel:find(".aditem-main--middle"):html() - place = sel:find(".aditem-main--top--left"):html() - print(description .. place) - content: "" - image: | - img = sel:find("div.imagebox"):first():attr("data-imgsrc") - if img ~= "" then - -- prepend host if needed - if not(img:match("https*:\/\/.*")) then - img = "https://www.ebay-kleinanzeigen.de" .. img - end - print(img) - end - nextpage: | - nextpage = sel:find("link[rel=next]"):attr("href") - print("https://www.ebay-kleinanzeigen.de" .. nextpage) - nextpagecount: 5 - sort: "" -- cgit v1.2.3