diff options
| author | Gertjan van den Burg <gertjanvandenburg@gmail.com> | 2019-02-08 17:39:58 +0000 |
|---|---|---|
| committer | Gertjan van den Burg <gertjanvandenburg@gmail.com> | 2019-02-08 17:39:58 +0000 |
| commit | cc3bceb78a94f4c8377468ed585bff93b71bada0 (patch) | |
| tree | 2cbff4578af29cb2beabfaba39f4c907a757d041 | |
| parent | Formatting (diff) | |
| download | paper2remarkable-cc3bceb78a94f4c8377468ed585bff93b71bada0.tar.gz paper2remarkable-cc3bceb78a94f4c8377468ed585bff93b71bada0.zip | |
Also update dearxiv function for older papers
| -rwxr-xr-x | arxiv2remarkable.py | 4 |
1 file changed, 2 insertions, 2 deletions
```diff
diff --git a/arxiv2remarkable.py b/arxiv2remarkable.py
index 7a2f144..6bb88fc 100755
--- a/arxiv2remarkable.py
+++ b/arxiv2remarkable.py
@@ -123,13 +123,13 @@ def dearxiv(input_file, pdftk_path="pdftk"):
         data = fid.read()
         # Remove the text element
         data = re.sub(
-            b"\(arXiv:\d{4}\.\d{5}v\d\s+\[\w+\.\w+\]\s+\d{1,2}\s\w{3}\s\d{4}\)Tj",
+            b"\(arXiv:\d{4}\.\d{4,5}v\d\s+\[\w+\.\w+\]\s+\d{1,2}\s\w{3}\s\d{4}\)Tj",
             b"()Tj",
             data,
         )
         # Remove the URL element
         data = re.sub(
-            b"<<\\n\/URI \(http://arxiv\.org/abs/\d{4}\.\d{5}v\d\)\\n\/S /URI\\n>>\\n",
+            b"<<\\n\/URI \(http://arxiv\.org/abs/\d{4}\.\d{4,5}v\d\)\\n\/S /URI\\n>>\\n",
             b"",
             data,
         )
```
