bmc/main.py

572 lines
22 KiB
Python
Raw Permalink Normal View History

2014-04-25 14:13:37 +02:00
#!/usr/bin/env python2
# -*- coding: utf8 -*-
import argparse
import os
2014-04-24 00:18:49 +02:00
import shutil
import subprocess
import sys
import tempfile
import backend
import fetcher
import tearpages
import tools
import params
2014-04-24 00:18:49 +02:00
from bibtexparser.bparser import BibTexParser
2014-05-09 23:37:17 +02:00
from codecs import open
2014-04-24 00:18:49 +02:00
EDITOR = os.environ.get('EDITOR') if os.environ.get('EDITOR') else 'vim'
2014-04-24 00:18:49 +02:00
2014-05-14 14:53:56 +02:00
def checkBibtex(filename, bibtex_string):
    """
    Show a bibtex entry to the user and let them fix it in EDITOR.

    The entry is printed and the user is asked whether it is correct. As long
    as the answer is "n" (or nothing could be parsed), the bibtex source is
    opened in EDITOR and parsed again. If the entry initially had a 'file'
    field and the edited entry has a different one, the file is moved to the
    new location.

    filename      -- name displayed in the messages
    bibtex_string -- bibtex source of the entry to check

    Returns the parsed entry, as found in BibTexParser.get_entry_dict().
    """
    print("The bibtex entry found for "+filename+" is:")

    bibtex = BibTexParser(bibtex_string)
    bibtex = bibtex.get_entry_dict()
    try:
        # Only the first parsed entry is considered
        bibtex = bibtex[list(bibtex.keys())[0]]
    except IndexError:
        # Nothing was parsed, go straight to the editor. Only the lookup is
        # guarded so that Ctrl-C at the prompt below is not swallowed.
        check = 'n'
    else:
        print(bibtex_string)
        check = tools.rawInput("Is it correct? [Y/n] ")

    # False means "the entry had no file field before edition"
    old_filename = bibtex.get('file', False)

    while check.lower() == 'n':
        with tempfile.NamedTemporaryFile(suffix=".tmp") as tmpfile:
            tmpfile.write(bibtex_string)
            tmpfile.flush()
            subprocess.call([EDITOR, tmpfile.name])
            tmpfile.seek(0)
            # Add extra \n for bibtexparser
            bibtex = BibTexParser(tmpfile.read()+"\n")

        bibtex = bibtex.get_entry_dict()
        try:
            bibtex = bibtex[list(bibtex.keys())[0]]
        except IndexError:
            tools.warning("Invalid bibtex entry")
            bibtex_string = ''
            tools.rawInput("Press Enter to go back to editor.")
            continue

        # NOTE(review): the entry is rejected only when the three fields are
        # all missing, and the key tested is 'authors' -- confirm this is the
        # field name produced by the parser.
        if('authors' not in bibtex and 'title' not in bibtex and 'year' not in
           bibtex):
            tools.warning("Invalid bibtex entry")
            bibtex_string = ''
            tools.rawInput("Press Enter to go back to editor.")
            continue

        if old_filename is not False and 'file' not in bibtex:
            # An entry which had a file must keep one
            tools.warning("Invalid bibtex entry. No filename given.")
            tools.rawInput("Press Enter to go back to editor.")
            check = 'n'
        else:
            bibtex_string = tools.parsed2Bibtex(bibtex)
            print("\nThe bibtex entry for "+filename+" is:")
            print(bibtex_string)
            check = tools.rawInput("Is it correct? [Y/n] ")

    if old_filename is not False and old_filename != bibtex['file']:
        try:
            print("Moving file to new location…")
            shutil.move(old_filename, bibtex['file'])
        except (IOError, OSError, shutil.Error):
            tools.warning("Unable to move file "+old_filename+" to " +
                          bibtex['file']+". You should check it manually.")

    return bibtex
2014-05-17 17:23:56 +02:00
def addFile(src, filetype, manual, autoconfirm, tag):
    """
    Add a file to the library

    src         -- path to the file to import
    filetype    -- 'article', 'book' or None to try every identifier
    manual      -- if True, do not look for an identifier in the file
    autoconfirm -- if True, do not ask the user to check the bibtex entry nor
                   to give a tag, the tag parameter is used as is
    tag         -- tag to use when autoconfirm is True

    Returns the name of the file in the library. Exits the program if the
    file cannot be copied.
    """
    doi = False
    arxiv = False
    isbn = False

    if not manual:
        if filetype == 'article' or filetype is None:
            doi = fetcher.findDOI(src)
            if doi is False:
                arxiv = fetcher.findArXivId(src)

        if filetype == 'book' or (doi is False and arxiv is False and
                                  filetype is None):
            isbn = fetcher.findISBN(src)

    if doi is False and isbn is False and arxiv is False:
        # No identifier found (or manual mode): ask the user
        if filetype is None:
            tools.warning("Could not determine the DOI nor the arXiv id nor " +
                          "the ISBN for "+src+". Switching to manual entry.")
            doi_arxiv_isbn = ''
            while doi_arxiv_isbn not in ['doi', 'arxiv', 'isbn', 'manual']:
                doi_arxiv_isbn = tools.rawInput("DOI / arXiv " +
                                                "/ ISBN / manual? ").lower()
            if doi_arxiv_isbn == 'doi':
                doi = tools.rawInput('DOI? ')
            elif doi_arxiv_isbn == 'arxiv':
                arxiv = tools.rawInput('arXiv id? ')
            elif doi_arxiv_isbn == 'isbn':
                isbn = tools.rawInput('ISBN? ')
        elif filetype == 'article':
            tools.warning("Could not determine the DOI nor the arXiv id for " +
                          src+", switching to manual entry.")
            doi_arxiv = ''
            while doi_arxiv not in ['doi', 'arxiv', 'manual']:
                doi_arxiv = tools.rawInput("DOI / arXiv / manual? ").lower()
            if doi_arxiv == 'doi':
                doi = tools.rawInput('DOI? ')
            elif doi_arxiv == 'arxiv':
                arxiv = tools.rawInput('arXiv id? ')
        elif filetype == 'book':
            tools.warning("Could not determine the ISBN for "+src +
                          ", switching to manual entry.")
            isbn = tools.rawInput('ISBN? ')
    elif doi is not False:
        print("DOI for "+src+" is "+doi+".")
    elif arxiv is not False:
        print("ArXiv id for "+src+" is "+arxiv+".")
    elif isbn is not False:
        print("ISBN for "+src+" is "+isbn+".")

    if doi is not False and doi != '':
        # Add extra \n for bibtexparser
        bibtex = fetcher.doi2Bib(doi).strip().replace(',', ",\n")+"\n"
    elif arxiv is not False and arxiv != '':
        bibtex = fetcher.arXiv2Bib(arxiv).strip().replace(',', ",\n")+"\n"
    elif isbn is not False and isbn != '':
        # Idem
        bibtex = fetcher.isbn2Bib(isbn).strip()+"\n"
    else:
        bibtex = ''

    bibtex = BibTexParser(bibtex)
    bibtex = bibtex.get_entry_dict()
    if len(bibtex) > 0:
        # Only the first parsed entry is considered
        bibtex_name = list(bibtex.keys())[0]
        bibtex = bibtex[bibtex_name]
        bibtex_string = tools.parsed2Bibtex(bibtex)
    else:
        bibtex_string = ''

    if not autoconfirm:
        bibtex = checkBibtex(src, bibtex_string)
        tag = tools.rawInput("Tag for this paper (leave empty for default) ? ")
    # With autoconfirm, the tag parameter is used as is. It must not be read
    # from the command line arguments, which only exist when run as a script.
    bibtex['tag'] = tag

    new_name = backend.getNewName(src, bibtex, tag)

    while os.path.exists(new_name):
        tools.warning("file "+new_name+" already exists.")
        default_rename = new_name.replace(tools.getExtension(new_name),
                                          " (2)"+tools.getExtension(new_name))
        rename = tools.rawInput("New name ["+default_rename+"]? ")
        if rename == '':
            new_name = default_rename
        else:
            new_name = rename
    bibtex['file'] = new_name

    try:
        shutil.copy2(src, new_name)
    except IOError:
        sys.exit("Unable to move file to library dir " + params.folder+".")

    # Remove first page of IOP papers
    if ('IOP' in bibtex.get('publisher', '') and
            bibtex.get('type') == 'article'):
        try:
            tearpages.tearpage(new_name)
        except Exception:
            # Best effort only, the import must not fail because of this
            tools.warning("Unable to remove the first page of "+new_name)

    backend.bibtexAppend(bibtex)
    return new_name
2014-04-24 00:18:49 +02:00
2014-05-05 00:19:29 +02:00
def editEntry(entry, file_id='both'):
    """
    Edit the bibtex of an entry of the index

    entry   -- a filename or an identifier
    file_id -- 'file', 'id' or 'both', passed to backend.getBibtex to tell
               how entry should be interpreted

    If the tag was changed, the file is moved to the name given by
    backend.getNewName and the previous directory is removed when empty.
    The index is then rewritten with the edited entry.

    Returns True on success, False if the entry does not exist or the index
    cannot be read. Raises Exception if the file cannot be moved after a tag
    edit.
    """
    bibtex = backend.getBibtex(entry, file_id)
    if bibtex is False:
        tools.warning("Entry "+entry+" does not exist.")
        return False

    if file_id == 'file':
        filename = entry
    else:
        filename = bibtex['file']
    new_bibtex = checkBibtex(filename, tools.parsed2Bibtex(bibtex))

    # Tag update. A missing tag field is handled as an empty tag.
    old_tag = bibtex.get('tag', '')
    new_tag = new_bibtex.get('tag', '')
    if new_tag != old_tag:
        print("Editing tag, moving file.")
        new_name = backend.getNewName(new_bibtex['file'],
                                      new_bibtex,
                                      new_tag)

        while os.path.exists(new_name):
            tools.warning("file "+new_name+" already exists.")
            default_rename = new_name.replace(tools.getExtension(new_name),
                                              " (2)" +
                                              tools.getExtension(new_name))
            rename = tools.rawInput("New name ["+default_rename+"]? ")
            if rename == '':
                new_name = default_rename
            else:
                new_name = rename
        new_bibtex['file'] = new_name

        try:
            shutil.move(bibtex['file'], new_bibtex['file'])
        except (IOError, OSError, shutil.Error):
            raise Exception('Unable to move file '+bibtex['file']+' to ' +
                            new_bibtex['file'] + ' according to tag edit.')

        # Remove the previous tag dir if the move left it empty
        old_dir = os.path.dirname(bibtex['file'])
        try:
            if not os.listdir(old_dir):
                os.rmdir(old_dir)
        except OSError:
            tools.warning("Unable to delete empty tag dir " + old_dir)

    try:
        with open(params.folder+'index.bib', 'r', encoding='utf-8') as fh:
            index = BibTexParser(fh.read())
        index = index.get_entry_dict()
    except Exception:
        # Read or parse error. Ctrl-C is not caught here on purpose.
        tools.warning("Unable to open index file.")
        return False

    index[new_bibtex['id']] = new_bibtex
    backend.bibtexRewrite(index)
    return True
2014-05-17 17:23:56 +02:00
def downloadFile(url, filetype, manual, autoconfirm, tag):
    """
    Download a file and add it to the library

    url -- url of the file to download
    filetype, manual, autoconfirm, tag -- passed unchanged to addFile

    Returns the value returned by addFile, or False if the download failed.
    """
    print('Downloading '+url)
    dl, contenttype = fetcher.download(url)

    if dl is False:
        tools.warning("Could not fetch "+url)
        return False

    print('Download finished')
    # The temporary file is removed when leaving the with block, even if
    # addFile fails. The data is written through the binary handle of the
    # temporary file itself rather than through a second text mode handle.
    with tempfile.NamedTemporaryFile(suffix='.'+contenttype) as tmp:
        tmp.write(dl)
        # addFile reads the file through its name, the data must be on disk
        tmp.flush()
        return addFile(tmp.name, filetype, manual, autoconfirm, tag)
def openFile(ident):
    """
    Open the file associated to an identifier with xdg-open

    ident -- identifier of the entry in the index

    Returns True if xdg-open was started, False if the index cannot be read,
    the identifier is unknown, the entry has no file or xdg-open cannot be
    started. xdg-open is not waited for.
    """
    try:
        with open(params.folder+'index.bib', 'r', encoding='utf-8') as fh:
            bibtex = BibTexParser(fh.read())
        bibtex = bibtex.get_entry_dict()
    except Exception:
        # Read or parse error. Ctrl-C is not caught here on purpose.
        tools.warning("Unable to open index file.")
        return False

    if ident not in bibtex:
        return False

    try:
        subprocess.Popen(['xdg-open', bibtex[ident]['file']])
    except (KeyError, OSError):
        # Entry without file field, or xdg-open not available
        return False
    return True
2014-05-01 00:45:31 +02:00
def _askFileForEntry(entry):
    """
    Ask which file should be attached to an index entry without file

    For each of the doi, Eprint and isbn fields of the entry, the identifier
    found in the given file is compared to the one of the entry. On mismatch
    the user has to confirm, else the file is asked again.

    Returns the filename typed by the user, '' meaning "delete the entry".
    """
    checks = [
        ('doi', fetcher.findDOI,
         "Found DOI does not match bibtex entry DOI, continue anyway " +
         "? [y/N]"),
        ('Eprint', fetcher.findArXivId,
         "Found arXiv id does not match bibtex entry arxiv id, " +
         "continue anyway ? [y/N]"),
        ('isbn', fetcher.findISBN,
         "Found ISBN does not match bibtex entry ISBN, continue anyway " +
         "? [y/N]"),
    ]

    while True:
        filename = tools.rawInput("File to import for this entry " +
                                  "(leave empty to delete the " +
                                  "entry)? ")
        if filename == '':
            return filename

        accepted = True
        for field, finder, question in checks:
            if field not in entry:
                continue
            found = finder(filename)
            if found is not False and found != entry[field]:
                if tools.rawInput(question).lower() != 'y':
                    # Mismatch refused by the user, ask for another file
                    accepted = False
                    break
        if accepted:
            return filename


def resync():
    """
    Resync the files of the library and the bibtex index

    Walks through the differences reported by backend.diffFilesIndex():
    * for an entry without file, asks for a file to import or deletes the
      entry,
    * for a file without entry, reimports the file or deletes it.
    Empty dirs directly under params.folder are then removed.

    Returns False if the diff could not be computed, None otherwise. Exits
    the program if a file cannot be copied to the library.
    """
    diff = backend.diffFilesIndex()

    if diff is False:
        return False

    for key in diff:
        entry = diff[key]
        if entry['file'] == '':
            print("\nFound entry in index without associated file: " +
                  entry['id'])
            print("Title:\t"+entry['title'])
            filename = _askFileForEntry(entry)
            if filename == '':
                backend.deleteId(entry['id'])
                print("Deleted entry \""+entry['id']+"\".")
            else:
                new_name = backend.getNewName(filename, entry)
                try:
                    shutil.copy2(filename, new_name)
                    print("Imported new file "+filename+" for entry " +
                          entry['id']+".")
                except IOError:
                    sys.exit("Unable to move file to library dir " +
                             params.folder+".")
                # NOTE(review): the index is given the source path and not
                # new_name -- confirm this is what backend.bibtexEdit expects.
                backend.bibtexEdit(entry['id'], {'file': filename})
        else:
            print("Found file without any associated entry in index:")
            print(entry['file'])
            action = ''
            while action.lower() not in ['import', 'delete']:
                action = tools.rawInput("What to do? [import / delete] ")
            action = action.lower()
            if action == 'import':
                # Keep the extension on the temporary copy
                extension = tools.getExtension(entry['file'])
                tmp = tempfile.NamedTemporaryFile(suffix=extension)
                try:
                    shutil.copy(entry['file'], tmp.name)
                    try:
                        os.remove(entry['file'])
                    except OSError:
                        tools.warning("Unable to delete file "+entry['file'])
                    # addFile expects 'article', 'book' or None as type, not
                    # a file extension: None lets it try every identifier.
                    if not addFile(tmp.name, None, False, False, ''):
                        tools.warning("Unable to reimport file " +
                                      entry['file'])
                finally:
                    tmp.close()
            else:
                backend.deleteFile(entry['file'])
                print(entry['file'] + " removed from disk and " +
                      "index.")

    # Check for empty tag dirs
    for i in os.listdir(params.folder):
        tag_dir = params.folder + i
        # The names returned by listdir are relative to params.folder
        if os.path.isdir(tag_dir) and not os.listdir(tag_dir):
            try:
                os.rmdir(tag_dir)
            except OSError:
                tools.warning("Found empty tag dir "+params.folder + i +
                              " but could not delete it.")
2014-05-01 00:45:31 +02:00
2014-05-14 22:45:25 +02:00
def update(entry):
    """
    Look for a new arXiv version of an entry and offer to import it

    entry -- entry passed to backend.updateArXiv

    If a new version is found, the user is asked whether it should be
    downloaded and, once it is imported, whether the previous version should
    be deleted. Nothing is deleted if the download fails.
    """
    new_version = backend.updateArXiv(entry)
    if new_version is False:
        return

    print("New version found for "+entry)
    print("\t Title: "+new_version['title'])
    confirm = tools.rawInput("Download it ? [Y/n] ")
    if confirm.lower() == 'n':
        return

    url = 'http://arxiv.org/pdf/'+new_version['eprint']
    # Not in manual mode, bibtex checked by the user, no tag forced
    new_name = downloadFile(url, 'article', False, False, '')
    if new_name is False:
        tools.warning("An error occurred while downloading "+url)
        # Keep the previous version as the new one could not be imported
        return
    print(new_version['eprint']+" successfully imported as "+new_name)

    confirm = tools.rawInput("Delete previous version ? [y/N] ")
    if confirm.lower() == 'y':
        # Try an id based deletion first, then a file based one
        if not backend.deleteId(entry):
            if not backend.deleteFile(entry):
                tools.warning("Unable to remove previous version.")
                return
        print("Previous version successfully deleted.")
2014-05-07 22:04:46 +02:00
2014-04-24 00:18:49 +02:00
def withoutSkipped(items, skipped):
    """
    Return items without duplicates nor skipped elements, in original order

    items   -- list of names given on the command line
    skipped -- list of names to leave out, or None if there is none
    """
    seen = set(skipped or [])
    kept = []
    for item in items:
        if item not in seen:
            seen.add(item)
            kept.append(item)
    return kept


if __name__ == '__main__':
    parser = argparse.ArgumentParser(description="A bibliography " +
                                     "management tool.")
    subparsers = parser.add_subparsers(help="sub-command help")

    parser_download = subparsers.add_parser('download', help="download help")
    parser_download.add_argument('-t', '--type', default=None,
                                 choices=['article', 'book'],
                                 help="type of the file to download")
    parser_download.add_argument('-m', '--manual', default=False,
                                 action='store_true',
                                 help="disable auto-download of bibtex")
    # -y is a flag, it must not expect a value
    parser_download.add_argument('-y', default=False,
                                 action='store_true',
                                 help="Confirm all")
    parser_download.add_argument('--tag', default='', help="Tag")
    parser_download.add_argument('url', nargs='+',
                                 help="url of the file to import")
    parser_download.set_defaults(func='download')

    parser_import = subparsers.add_parser('import', help="import help")
    parser_import.add_argument('-t', '--type', default=None,
                               choices=['article', 'book'],
                               help="type of the file to import")
    parser_import.add_argument('-m', '--manual', default=False,
                               action='store_true',
                               help="disable auto-download of bibtex")
    parser_import.add_argument('-y', default=False,
                               action='store_true',
                               help="Confirm all")
    parser_import.add_argument('--tag', default='', help="Tag")
    parser_import.add_argument('file', nargs='+',
                               help="path to the file to import")
    parser_import.add_argument('--skip', nargs='+',
                               help="path to files to skip")
    parser_import.set_defaults(func='import')

    parser_delete = subparsers.add_parser('delete', help="delete help")
    parser_delete.add_argument('entries', metavar='entry', nargs='+',
                               help="a filename or an identifier")
    parser_delete.add_argument('--skip', nargs='+',
                               help="path to files to skip")
    group = parser_delete.add_mutually_exclusive_group()
    group.add_argument('--id', action="store_true", default=False,
                       help="id based deletion")
    group.add_argument('--file', action="store_true", default=False,
                       help="file based deletion")
    parser_delete.add_argument('-f', '--force', default=False,
                               action='store_true',
                               help="delete without confirmation")
    parser_delete.set_defaults(func='delete')

    parser_edit = subparsers.add_parser('edit', help="edit help")
    parser_edit.add_argument('entries', metavar='entry', nargs='+',
                             help="a filename or an identifier")
    parser_edit.add_argument('--skip', nargs='+',
                             help="path to files to skip")
    group = parser_edit.add_mutually_exclusive_group()
    group.add_argument('--id', action="store_true", default=False,
                       help="id based edit")
    group.add_argument('--file', action="store_true", default=False,
                       help="file based edit")
    parser_edit.set_defaults(func='edit')

    parser_list = subparsers.add_parser('list', help="list help")
    parser_list.set_defaults(func='list')

    parser_open = subparsers.add_parser('open', help="open help")
    parser_open.add_argument('ids', metavar='id', nargs='+',
                             help="an identifier")
    parser_open.set_defaults(func='open')

    parser_resync = subparsers.add_parser('resync', help="resync help")
    parser_resync.set_defaults(func='resync')

    parser_update = subparsers.add_parser('update', help="update help")
    parser_update.add_argument('--entries', metavar='entry', nargs='+',
                               help="a filename or an identifier")
    parser_update.set_defaults(func='update')

    # The search sub-command is registered only once
    parser_search = subparsers.add_parser('search', help="search help")
    parser_search.add_argument('query', metavar='entry', nargs='+',
                               help="your query, see README for more info.")
    parser_search.set_defaults(func='search')

    args = parser.parse_args()
    try:
        if args.func == 'download':
            for url in args.url:
                new_name = downloadFile(url, args.type, args.manual, args.y,
                                        args.tag)
                if new_name is not False:
                    print(url+" successfully imported as "+new_name)
                else:
                    tools.warning("An error occurred while downloading "+url)
            sys.exit()

        elif args.func == 'import':
            for filename in withoutSkipped(args.file, args.skip):
                new_name = addFile(filename, args.type, args.manual, args.y,
                                   args.tag)
                if new_name is not False:
                    print(filename+" successfully imported as " +
                          new_name+".")
                else:
                    tools.warning("An error occurred while importing " +
                                  filename)
            sys.exit()

        elif args.func == 'delete':
            for filename in withoutSkipped(args.entries, args.skip):
                if not args.force:
                    confirm = tools.rawInput("Are you sure you want to " +
                                             "delete "+filename+" ? [y/N] ")
                else:
                    confirm = 'y'

                if confirm.lower() == 'y':
                    # Id based deletion first unless --file is given, then
                    # file based deletion unless --id is given
                    if args.file or not backend.deleteId(filename):
                        if args.id or not backend.deleteFile(filename):
                            tools.warning("Unable to delete "+filename)
                            sys.exit(1)

                    print(filename+" successfully deleted.")
            sys.exit()

        elif args.func == 'edit':
            for filename in withoutSkipped(args.entries, args.skip):
                if args.file:
                    file_id = 'file'
                elif args.id:
                    file_id = 'id'
                else:
                    file_id = 'both'
                editEntry(filename, file_id)
            sys.exit()

        elif args.func == 'list':
            listPapers = tools.listDir(params.folder)
            listPapers.sort()

            for paper in listPapers:
                if tools.getExtension(paper) not in [".pdf", ".djvu"]:
                    continue
                print(paper)

        elif args.func == 'search':
            raise Exception('TODO')

        elif args.func == 'open':
            for filename in args.ids:
                if not openFile(filename):
                    sys.exit("Unable to open file associated " +
                             "to ident "+filename)
            sys.exit()

        elif args.func == 'resync':
            confirm = tools.rawInput("Resync files and bibtex index? [y/N] ")
            if confirm.lower() == 'y':
                resync()
            sys.exit()

        elif args.func == 'update':
            if args.entries is None:
                entries = backend.getEntries()
            else:
                entries = args.entries
            for entry in entries:
                update(entry)
            sys.exit()
    except KeyboardInterrupt:
        sys.exit()