Skip to content

Commit 5460c72

Browse files
committed
Fix bug with arxiv links
1 parent 3313775 commit 5460c72

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

download.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -32,16 +32,17 @@ def clean_header(text):
3232
if point.name == 'h1':
3333
level1_directory = os.path.join('pdfs', clean_header(point.text))
3434
os.makedirs(level1_directory)
35-
print('\n'.join((point.text, "+" * len(point.text), "")))
35+
print('\n'.join(("", point.text, "+" * len(point.text))))
3636

3737
elif point.name == 'h2':
3838
current_directory = os.path.join(level1_directory, clean_header(point.text))
3939
os.mkdir(current_directory)
40-
print('\n'.join((point.text, "+" * len(point.text), "")))
40+
print('\n'.join(("", point.text, "-" * len(point.text))))
4141

4242
elif point.name == 'p':
4343
link = clean_pdf_link(point.find('a').attrs['href'])
4444
extension = os.path.splitext(link)[1][1:]
45+
extension = 'pdf' if extension not in ['pdf', 'html'] else extension
4546
name = point.text.split('[' + extension + ']')[0].replace('.', '').replace('/', '_')
4647
if link is not None:
4748
print(name + ' (' + link + ')')

0 commit comments

Comments (0)