From 804356a1393acc8ad27c856829979a2cc4a9663a Mon Sep 17 00:00:00 2001
From: ColumbusUtrigas
Date: Thu, 18 Aug 2022 07:41:44 +0400
Subject: [PATCH] nvidia research parser

---
Review notes (text in this section is not part of the commit message):
  * index() is assumed to return the Flask quickstart string
    "<p>Hello, World!</p>"; confirm against the author's tree.
  * The commit id and blob hashes were carried over from the original
    submission and do not describe the revised file contents.

 app.py            | 19 +++++++++++++++++++
 parsers/nvidia.py | 46 ++++++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 65 insertions(+)
 create mode 100644 app.py
 create mode 100644 parsers/nvidia.py

diff --git a/app.py b/app.py
new file mode 100644
index 0000000..6f0e41a
--- /dev/null
+++ b/app.py
@@ -0,0 +1,19 @@
+"""Flask app that serves scraped publication lists as RSS feeds."""
+
+from flask import Flask, Response
+
+from parsers.nvidia import parseNvidia
+
+app = Flask(__name__)
+
+
+@app.route("/")
+def index():
+    """Return a static greeting for the site root."""
+    return "<p>Hello, World!</p>"
+
+
+@app.route("/nvidia")
+def rss_query():
+    """Serve the feed built by parseNvidia() with an XML mimetype."""
+    return Response(parseNvidia(), mimetype='text/xml')
diff --git a/parsers/nvidia.py b/parsers/nvidia.py
new file mode 100644
index 0000000..66d8131
--- /dev/null
+++ b/parsers/nvidia.py
@@ -0,0 +1,46 @@
+"""Scraper that turns the NVIDIA Research publications page into RSS."""
+
+from urllib.parse import urljoin
+
+from pyquery import PyQuery as pq
+from feedgen.feed import FeedGenerator
+
+
+def parseNvidia():
+    """Fetch the publications listing and return it as an RSS document.
+
+    Every element matching ``.views-field-title`` that contains a link
+    becomes one feed entry whose id and link are the publication URL and
+    whose title is the link text.
+
+    Returns:
+        The value of ``FeedGenerator.rss_str()`` for the assembled feed.
+    """
+    root_url = 'https://research.nvidia.com'
+    d = pq(root_url + '/publications')
+
+    fg = FeedGenerator()
+    fg.id(root_url)
+    fg.title('NVidia Research')
+    fg.link(href=root_url, rel='alternate')
+    fg.logo(root_url + '/favicon.ico')
+    fg.description('NVidia Research papers')
+
+    for elem in d('.views-field-title').items():
+        link = elem.find('a')
+        href = link.attr.href
+        if not href:
+            # No anchor (or no href) inside this element; concatenating
+            # root_url with None would raise TypeError, so skip it.
+            continue
+
+        # urljoin resolves site-relative paths and leaves absolute URLs
+        # intact, unlike plain string concatenation.
+        url = urljoin(root_url, href)
+
+        fe = fg.add_entry()
+        fe.id(url)
+        fe.title(link.text())
+        fe.link(href=url)
+
+    return fg.rss_str()