# jzhang
# 4/2/2018 - 1:07 PM
#
# Download arXiv PDF files
#
# Download arXiv PDF files

import pyarxiv as paq
from pyarxiv.arxiv_categories import ArxivCategory
import pprint

# Search terms submitted to arXiv through pyarxiv, one query per term.
qstrings = ['GDPR', 'data protection', 'stream', 'pipeline']

# One dict (title / description / url) per returned result, accumulated
# across all search terms in query order. Results are not de-duplicated
# across terms.
posts = []
for qs in qstrings:
    # Request at most 200 results for this search term.
    items = paq.query(max_results=200, querystring=qs)
    # Iterate the results directly rather than indexing by position.
    # Assumes each result exposes .title, .summary and .link attributes,
    # as the original index-based code did.
    posts.extend(
        {
            'title': item.title,
            'description': item.summary,
            'url': item.link,
        }
        for item in items
    )
pprint.pprint(posts)
import feedparser
import pprint
import json

# Fetch and parse the arXiv RSS feed at the URL below.
feed = feedparser.parse('http://export.arxiv.org/rss/cs')

# Build one dict (title / description / url) per feed entry.
# NOTE: this rebinds `posts`, so any list previously stored under that name
# is discarded at this point.
posts = [
    {
        'title': entry.title,
        'description': entry.summary,
        'url': entry.link,
    }
    for entry in feed['entries']
]
pprint.pprint(posts)